Spaces:
Running
Running
File size: 265 Bytes
37c1830 |
1 2 3 4 5 6 7 8 |
import pandas as pd
from autorag.data.chunk import langchain_chunk
def chunk(raw_df: pd.DataFrame, method: str, lang: str = "en", **kwargs) -> pd.DataFrame:
    """Chunk ``raw_df`` by delegating to ``langchain_chunk``.

    Args:
        raw_df: DataFrame handed to ``langchain_chunk`` unchanged.
            NOTE(review): presumably the parsed/raw document table that
            AutoRAG's chunkers expect -- confirm the schema against callers.
        method: Forwarded as the ``chunk_method`` keyword.
        lang: Forwarded as the ``add_file_name`` keyword (defaults to
            ``"en"``). NOTE(review): this looks like the language used when
            file names are added to chunks -- confirm against the AutoRAG
            chunk documentation.
        **kwargs: Any extra keyword arguments, passed through as-is.

    Returns:
        Whatever ``langchain_chunk`` returns (annotated as a DataFrame).
    """
    # Keywords are passed directly (not merged into a dict) so that a caller
    # who also supplies ``chunk_method``/``add_file_name`` in ``kwargs`` still
    # gets Python's duplicate-keyword TypeError.
    return langchain_chunk(
        raw_df,
        chunk_method=method,
        add_file_name=lang,
        **kwargs,
    )
|