mirror of
https://github.com/holodata/sensai-dataset.git
synced 2025-03-15 20:10:32 +09:00
14 lines
373 B
Python
14 lines
373 B
Python
from datasets.features import ClassLabel, Features, Value
|
|
from datasets.load import load_dataset
|
|
|
|
|
|
def load_sensai_dataset():
    """Load the ``holodata/sensai`` dataset and return its ``train`` split.

    The dataset is requested with an explicit schema: ``body`` is declared
    as a string value and ``toxic`` as a two-class label whose class names
    are ``'0'`` and ``'1'``.

    Returns:
        The object stored under the ``'train'`` key of the loaded dataset.
    """
    # Declare the column schema up front so the loader call stays short.
    schema = Features(
        {
            "body": Value("string"),
            "toxic": ClassLabel(num_classes=2, names=["0", "1"]),
        }
    )
    splits = load_dataset("holodata/sensai", features=schema)
    return splits["train"]
|