from aevyra_verdict import Dataset
# ---------------------------------------------------------------------------
# Loading from JSONL
# ---------------------------------------------------------------------------

# Without a `format` argument the format is auto-detected (the default).
dataset = Dataset.from_jsonl("data.jsonl")

# Pass `format` to name the format explicitly instead of auto-detecting it.
dataset = Dataset.from_jsonl("sharegpt_data.jsonl", format="sharegpt")
dataset = Dataset.from_jsonl("alpaca_data.jsonl", format="alpaca")

# Arbitrary JSONL with custom field names: say which fields to read.
dataset = Dataset.from_jsonl(
    "data.jsonl",
    input_field="question",
    output_field="answer",
)

# Same idea, but label-free: output_field=None.
dataset = Dataset.from_jsonl(
    "data.jsonl",
    input_field="prompt",
    output_field=None,
)

# ---------------------------------------------------------------------------
# Loading from CSV
# ---------------------------------------------------------------------------

# Default column names are used here (input, ideal).
dataset = Dataset.from_csv("data.csv")

# Custom column names.
dataset = Dataset.from_csv(
    "data.csv",
    input_field="article",
    output_field="summary",
)

# Label-free CSV (no reference answers): output_field=None.
dataset = Dataset.from_csv("data.csv", output_field=None)

# ---------------------------------------------------------------------------
# Inspecting the loaded dataset
# ---------------------------------------------------------------------------

print(dataset.summary())
# Example output:
# {'name': 'data', 'num_conversations': 50, 'has_ideals': True, 'metadata_keys': ['category']}