File size: 265 Bytes
37c1830
 
 
 
 
 
 
1
2
3
4
5
6
7
8
import pandas as pd
from autorag.data.chunk import langchain_chunk


def chunk(raw_df: pd.DataFrame, method: str, lang: str = "en", **kwargs) -> pd.DataFrame:
	"""Chunk ``raw_df`` by delegating to ``langchain_chunk``.

	Args:
		raw_df: DataFrame handed to ``langchain_chunk`` as its first
			positional argument.
		method: Forwarded as the ``chunk_method`` keyword.
		lang: Forwarded as the ``add_file_name`` keyword. Defaults to ``"en"``.
			NOTE(review): presumably the language used when prepending the
			file name to each chunk -- confirm against the autorag chunker.
		**kwargs: Any further keyword arguments, passed through unchanged.

	Returns:
		The value returned by ``langchain_chunk``.
	"""
	return langchain_chunk(
		raw_df,
		chunk_method=method,
		add_file_name=lang,
		**kwargs,
	)