Trial-OpenAI / utils /embedding_generation.py
AashitaK's picture
Update utils/embedding_generation.py
90aed10 verified
raw
history blame contribute delete
457 Bytes
import pandas as pd
from utils.openai_api import get_embedding
def compute_doc_embeddings(df: pd.DataFrame) -> dict[tuple[str, str], list[float]]:
    """
    Build a lookup of embeddings for every row of ``df``.

    Each row's ``description`` value is passed to ``get_embedding`` (imported
    from ``utils.openai_api``), and the result is stored under that row's
    index label. The returned dictionary therefore maps row index -> embedding.

    NOTE(review): the return annotation assumes the dataframe index labels are
    ``(str, str)`` tuples and that ``get_embedding`` returns a list of floats;
    neither is established in this module - confirm against the callers.
    """
    embeddings_by_index = {}
    # iterrows() yields (index label, row Series) pairs in dataframe order.
    for row_label, row in df.iterrows():
        embeddings_by_index[row_label] = get_embedding(row.description)
    return embeddings_by_index