You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

94 lines
2.0 KiB

3 years ago
3 years ago
  1. Generic_TextFile = """
  2. 202104210943.txt
  3. 202104210944.txt
  4. 202104210945.txt
  5. """
  6. Generic_ImageFile = """
  7. 202104210943.png
  8. 202104210944.png
  9. 202104210945.png
  10. """
  11. Generic_AudioFile = """
  12. 202104210943.mp3
  13. 202104210944.mp3
  14. 202104210945.mp3
  15. """
  16. Generic_TextLine = """
  17. Terrible customer service.
  18. Really great transaction.
  19. Great price.
  20. """
  21. Category_CSV = """
  22. column_data,column_label
  23. "Terrible customer service.","negative"
  24. "Really great transaction.","positive"
  25. "Great price.","positive"
  26. """
  27. Category_fastText = """
  28. __label__negative Terrible customer service.
  29. __label__positive Really great transaction.
  30. __label__positive Great price.
  31. """
  32. Category_JSON = """
  33. [
  34. {
  35. "column_data": "Terrible customer service.",
  36. "column_label": ["negative"]
  37. }
  38. ]
  39. """
  40. Category_JSONL = """
  41. {"column_data": "Terrible customer service.", "column_label": ["negative"]}
  42. {"column_data": "Really great transaction.", "column_label": ["positive"]}
  43. {"column_data": "Great price.", "column_label": ["positive"]}
  44. """
  45. Text_CSV = """
  46. column_data,column_label
  47. "Hello!","こんにちは!"
  48. "Good morning.","おはようございます。"
  49. "See you.","さようなら。"
  50. """
  51. Text_JSON = """
  52. [
  53. {
  54. "text": "Hello!",
  55. "labels": ["こんにちは!"]
  56. }
  57. ]
  58. """
  59. Text_JSONL = """
  60. {"column_data": "Hello!", "column_label": ["こんにちは!"]}
  61. {"column_data": "Good morning.", "column_label": ["おはようございます。"]}
  62. {"column_data": "See you.", "column_label": ["さようなら。"]}
  63. """
  64. Offset_JSONL = """
  65. {"column_data": "EU rejects German call to boycott British lamb.", "column_label": [ [0, 2, "ORG"], ... ]}
  66. {"column_data": "Peter Blackburn", "column_label": [ [0, 15, "PERSON"] ]}
  67. {"column_data": "President Obama", "column_label": [ [10, 15, "PERSON"] ]}
  68. """
  69. Offset_CoNLL = """
  70. EU B-ORG
  71. rejects O
  72. German B-MISC
  73. call O
  74. to O
  75. boycott O
  76. British B-MISC
  77. lamb O
  78. . O
  79. Peter B-PER
  80. Blackburn I-PER
  81. """