File size: 653 Bytes
268c7f9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
from typing import Sequence

import numpy as np


class Vectorizer:
    """Thin adapter that turns text prompts into vectors via an embedding model.

    The wrapped object only needs to expose an ``encode`` method; this class
    stores it and forwards prompts to it.
    """

    def __init__(self, model) -> None:
        """Store the embedding model used by ``transform``.

        Args:
            model: Object exposing ``encode(prompts)``. Presumably a
                pre-trained embedding model; it is kept as-is on
                ``self.model`` without validation.
        """
        self.model = model

    def transform(self, prompts: Sequence[str]) -> np.ndarray:
        """Encode the given prompts with the wrapped model.

        Args:
            prompts: The sequence of raw corpus prompts.

        Returns:
            Whatever ``self.model.encode(prompts)`` returns, passed through
            untouched. The annotation assumes the model yields a numpy
            array; no conversion is performed here.
        """
        encoder = self.model
        vectors = encoder.encode(prompts)
        return vectors