jeffrey
init commit
37c1830
raw
history blame contribute delete
265 Bytes
import pandas as pd
from autorag.data.chunk import langchain_chunk
def chunk(raw_df: pd.DataFrame, method: str, lang: str = "en", **kwargs) -> pd.DataFrame:
    """Chunk *raw_df* by delegating to AutoRAG's ``langchain_chunk``.

    Args:
        raw_df: Input frame handed to ``langchain_chunk`` unchanged.
            NOTE(review): presumably the parsed-document frame produced by
            an earlier parse step -- confirm against the caller.
        method: Forwarded as ``chunk_method``.
        lang: Forwarded as ``add_file_name``; defaults to ``"en"``.
            NOTE(review): AutoRAG appears to treat this value as the language
            of the file-name prefix added to each chunk -- confirm in the
            AutoRAG chunk documentation.
        **kwargs: Extra keyword arguments passed through untouched.

    Returns:
        Whatever ``langchain_chunk`` returns (annotated as a DataFrame).
    """
    return langchain_chunk(
        raw_df,
        chunk_method=method,
        add_file_name=lang,
        **kwargs,
    )