# Mirror of https://github.com/doccano/doccano.git
# Topics: python, annotation-tool, datasets, active-learning, text-annotation,
# dataset, natural-language-processing, data-labeling, machine-learning
# File size: 99 lines, 2.2 KiB
# Sample directory-tree listing of three ``.txt`` files.
# Presumably displayed as an example of a plain-text file upload -- confirm
# against the code that references this constant.
Generic_TextFile = """
├── 202104210943.txt
├── 202104210944.txt
└── 202104210945.txt
"""

# Sample directory-tree listing of three ``.png`` files.
# Presumably displayed as an example of an image file upload -- confirm
# against the code that references this constant.
Generic_ImageFile = """
├── 202104210943.png
├── 202104210944.png
└── 202104210945.png
"""

# Sample directory-tree listing of three ``.mp3`` files.
# Presumably displayed as an example of an audio file upload -- confirm
# against the code that references this constant.
Generic_AudioFile = """
├── 202104210943.mp3
├── 202104210944.mp3
└── 202104210945.mp3
"""

# Sample of line-oriented text: three short sentences, one per line.
Generic_TextLine = """
Terrible customer service.
Really great transaction.
Great price.
"""

# Sample CSV with a header row (``column_data``, ``column_label``) followed by
# three quoted text/label records.
Category_CSV = """
column_data,column_label
"Terrible customer service.","negative"
"Really great transaction.","positive"
"Great price.","positive"
"""

# Sample in fastText style: each line is a ``__label__<name>`` prefix followed
# by the text it labels.
Category_fastText = """
__label__negative Terrible customer service.
__label__positive Really great transaction.
__label__positive Great price.
"""

# Sample JSON document: an array holding one object whose ``column_data`` is
# the text and whose ``column_label`` is a list of label names.
Category_JSON = """
[
    {
        "column_data": "Terrible customer service.",
        "column_label": ["negative"]
    }
]
"""

# Sample JSON Lines data: one JSON object per line, each with a text field
# (``column_data``) and a list of label names (``column_label``).
Category_JSONL = """
{"column_data": "Terrible customer service.", "column_label": ["negative"]}
{"column_data": "Really great transaction.", "column_label": ["positive"]}
{"column_data": "Great price.", "column_label": ["positive"]}
"""

# Sample CSV with a header row (``column_data``, ``column_label``) followed by
# three quoted records pairing an English phrase with a Japanese phrase.
Text_CSV = """
column_data,column_label
"Hello!","こんにちは!"
"Good morning.","おはようございます。"
"See you.","さようなら。"
"""

# Sample JSON document: an array holding one object that pairs an English
# phrase (``text``) with a list of Japanese phrases (``labels``).
# NOTE(review): the keys here are "text"/"labels", whereas the Text_CSV and
# Text_JSONL samples in this file use "column_data"/"column_label" -- confirm
# which naming is intended before changing either.
Text_JSON = """
[
    {
        "text": "Hello!",
        "labels": ["こんにちは!"]
    }
]
"""

# Sample JSON Lines data: one JSON object per line, each pairing an English
# phrase (``column_data``) with a list of Japanese phrases (``column_label``).
Text_JSONL = """
{"column_data": "Hello!", "column_label": ["こんにちは!"]}
{"column_data": "Good morning.", "column_label": ["おはようございます。"]}
{"column_data": "See you.", "column_label": ["さようなら。"]}
"""

# Sample JSON Lines data for span labels: each line has a text field
# (``column_data``) and a list of ``[start, end, label]`` triples
# (``column_label``); in the fully specified rows ``text[start:end]`` is the
# labelled substring.
# The ``...`` in the first row is an elision placeholder, so that row is
# illustrative only and is not parseable JSON as written.
Offset_JSONL = """
{"column_data": "EU rejects German call to boycott British lamb.", "column_label": [ [0, 2, "ORG"], ... ]}
{"column_data": "Peter Blackburn", "column_label": [ [0, 15, "PERSON"] ]}
{"column_data": "President Obama", "column_label": [ [10, 15, "PERSON"] ]}
"""

# Sample in CoNLL style: one ``token tag`` pair per line, with B-/I-/O tags.
# The empty line separates the two sentences.
Offset_CoNLL = """
EU B-ORG
rejects O
German B-MISC
call O
to O
boycott O
British B-MISC
lamb O
. O

Peter B-PER
Blackburn I-PER
"""

# Sample JSON Lines data combining span labels and categories: each line has
# the utterance (``text``), a list of ``[start, end, label]`` spans
# (``entities``) where ``text[start:end]`` is the labelled substring, and a
# list of category names (``cats``).
# The first span is [19, 26] so that it covers exactly "Memphis".
IDSF_JSONL = """
{"text": "Find a flight from Memphis to Tacoma", "entities": [[19, 26, "City"], [30, 36, "City"]], "cats": ["flight"]}
{"text": "I want to know what airports are in Los Angeles", "entities": [[36, 47, "City"]], "cats": ["airport"]}
"""
