You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

99 lines
2.2 KiB

# Tree-style listing of three .txt files (names look like YYYYMMDDHHMM
# timestamps). The newline right after the opening quotes is trimmed by
# TOML, so the value starts at the first "├──" line.
# NOTE(review): presumably shown to users as a sample layout - confirm
# against the code that reads this key.
Generic_TextFile = """
├── 202104210943.txt
├── 202104210944.txt
└── 202104210945.txt
"""
# Tree-style listing of three .png files; same shape as a plain directory
# listing, one entry per line, last entry drawn with "└──".
Generic_ImageFile = """
├── 202104210943.png
├── 202104210944.png
└── 202104210945.png
"""
# Tree-style listing of three .mp3 files, one entry per line, last entry
# drawn with "└──".
Generic_AudioFile = """
├── 202104210943.mp3
├── 202104210944.mp3
└── 202104210945.mp3
"""
# Three unlabeled English sentences, one per line.
Generic_TextLine = """
Terrible customer service.
Really great transaction.
Great price.
"""
# CSV sample: a `column_data,column_label` header row followed by three
# double-quoted text/label rows. Each row carries a single label
# ("negative" or "positive").
Category_CSV = """
column_data,column_label
"Terrible customer service.","negative"
"Really great transaction.","positive"
"Great price.","positive"
"""
# Three sentences, one per line, each prefixed with a `__label__<name>`
# token and a space before the text.
Category_fastText = """
__label__negative Terrible customer service.
__label__positive Really great transaction.
__label__positive Great price.
"""
# JSON sample: an array holding one object. `column_data` is the text and
# `column_label` is a list of label strings (one label in this sample).
Category_JSON = """
[
{
"column_data": "Terrible customer service.",
"column_label": ["negative"]
}
]
"""
# JSON Lines sample: one object per line, each with a `column_data` string
# and a `column_label` list of label strings.
Category_JSONL = """
{"column_data": "Terrible customer service.", "column_label": ["negative"]}
{"column_data": "Really great transaction.", "column_label": ["positive"]}
{"column_data": "Great price.", "column_label": ["positive"]}
"""
# CSV sample whose label column holds free text rather than a category:
# each row pairs an English phrase with Japanese text.
# NOTE(review): presumably a text-to-text (e.g. translation) example -
# confirm against the consumer of this key.
Text_CSV = """
column_data,column_label
"Hello!","こんにちは!"
"Good morning.","おはようございます。"
"See you.","さようなら。"
"""
# JSON sample: an array holding one object that pairs an English phrase
# (`column_data`) with a list of text labels (`column_label`). The key
# names match the Text_CSV header and the Text_JSONL / Category_JSON
# samples so every format in this file advertises the same field names.
Text_JSON = """
[
{
"column_data": "Hello!",
"column_label": ["こんにちは!"]
}
]
"""
# JSON Lines sample: one object per line, pairing an English phrase in
# `column_data` with a one-element list of Japanese text in `column_label`.
Text_JSONL = """
{"column_data": "Hello!", "column_label": ["こんにちは!"]}
{"column_data": "Good morning.", "column_label": ["おはようございます。"]}
{"column_data": "See you.", "column_label": ["さようなら。"]}
"""
# JSON Lines sample for span labels: `column_label` is a list of
# [start, end, type] triples. In the rows shown the offsets are 0-based
# character positions with an exclusive end (e.g. [10, 15] covers "Obama"
# in "President Obama").
# NOTE(review): the `...` in the first row is a literal placeholder, so that
# row is not valid JSON as written - presumably illustrative only; confirm
# nothing parses this value.
Offset_JSONL = """
{"column_data": "EU rejects German call to boycott British lamb.", "column_label": [ [0, 2, "ORG"], ... ]}
{"column_data": "Peter Blackburn", "column_label": [ [0, 15, "PERSON"] ]}
{"column_data": "President Obama", "column_label": [ [10, 15, "PERSON"] ]}
"""
# CoNLL-style sample: one "token tag" pair per line using B-/I-/O tags.
# The blank line after ". O" is significant: in CoNLL files an empty line
# ends a sentence, so "Peter Blackburn" is a separate sentence rather than
# a continuation of "EU rejects ... lamb .".
Offset_CoNLL = """
EU B-ORG
rejects O
German B-MISC
call O
to O
boycott O
British B-MISC
lamb O
. O

Peter B-PER
Blackburn I-PER
"""
# JSON Lines sample with three fields per object: `text`, `entities`
# ([start, end, label] character spans, 0-based, end exclusive) and `cats`
# (a list of category strings).
# Each span slices exactly the named city: text[19:26] is "Memphis" and
# text[30:36] is "Tacoma" in the first row; text[36:47] is "Los Angeles"
# in the second.
IDSF_JSONL = """
{"text": "Find a flight from Memphis to Tacoma", "entities": [[19, 26, "City"], [30, 36, "City"]], "cats": ["flight"]}
{"text": "I want to know what airports are in Los Angeles", "entities": [[36, 47, "City"]], "cats": ["airport"]}
"""