# Datasets
# Datasets
# APIs
from datasets import load_dataset, Dataset
# Quick-reference snippets for the Hugging Face `datasets` API. Each line is a
# standalone example rather than a step in one script (note that `df` is
# consumed by from_pandas before the to_pandas line assigns it). `json_file`,
# `i`, `df`, and `columns_to_remove` are not defined here and are presumably
# supplied by the surrounding context.

# Load a JSON / JSON Lines file. Passing split="train" returns a single
# Dataset instead of a DatasetDict keyed by split name.
raw_dataset = load_dataset("json", data_files=json_file, split="train")
# Take the 20 rows at indices i .. i+19. select() returns a new Dataset;
# raw_dataset itself is left unchanged.
filtered_dataset = raw_dataset.select(range(i,i+20))
# Build a Dataset from a pandas DataFrame.
raw_dataset = Dataset.from_pandas(df)
# Convert a Dataset back into a pandas DataFrame.
df = raw_dataset.to_pandas()
# Drop the named column(s). remove_columns() returns a new Dataset rather
# than modifying raw_dataset in place.
comment_dataset = raw_dataset.remove_columns(columns_to_remove)