File size: 716 Bytes
85c1145
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
from typing import Sequence
import numpy as np


class Vectorizer:
    """Wrap an embedding model and expose it through ``transform``."""

    def __init__(self, model) -> None:
        """Keep a reference to the embedding model used for encoding.

        Args:
            model: The pre-trained embedding model. It must provide an
                ``encode(prompts, show_progress_bar=...)`` method, because
                that is the only call ``transform`` makes on it.
        """
        self.model = model

    def transform(self, prompts: Sequence[str]) -> np.ndarray:
        """Encode raw text prompts into vectors with the wrapped model.

        The call is forwarded to ``self.model.encode`` with
        ``show_progress_bar=True``; no other processing is done here.

        Args:
            prompts: The sequence of raw corpus prompts.

        Returns:
            Whatever ``self.model.encode`` returns, passed through
            unchanged. Annotated as a numpy array -- NOTE(review): this
            relies on the model's ``encode`` producing one; confirm for
            the model actually injected.
        """
        return self.model.encode(prompts, show_progress_bar=True)