You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

629 lines
20 KiB

  1. <!doctype html>
  2. <html lang="en" class="no-js">
  3. <head>
  4. <meta charset="utf-8">
  5. <meta name="viewport" content="width=device-width,initial-scale=1">
  6. <meta name="description" content="A Text Annotation tool for Humans">
  7. <link rel="canonical" href="https://doccano.github.io/doccano/">
  8. <meta name="author" content="Hiroki Nakayama">
  9. <link rel="shortcut icon" href="assets/images/favicon.png">
  10. <meta name="generator" content="mkdocs-1.1.2, mkdocs-material-6.1.0">
  11. <title>doccano</title>
  12. <link rel="stylesheet" href="assets/stylesheets/main.bc7e593a.min.css">
  13. <link rel="stylesheet" href="assets/stylesheets/palette.ab28b872.min.css">
  14. <meta name="theme-color" content="#00bdd6">
  15. <link href="https://fonts.gstatic.com" rel="preconnect" crossorigin>
  16. <link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Roboto:300,400,400i,700%7CRoboto+Mono&display=fallback">
  17. <style>body,input{font-family:"Roboto",-apple-system,BlinkMacSystemFont,Helvetica,Arial,sans-serif}code,kbd,pre{font-family:"Roboto Mono",SFMono-Regular,Consolas,Menlo,monospace}</style>
  18. </head>
  19. <body dir="ltr" data-md-color-scheme="" data-md-color-primary="cyan" data-md-color-accent="cyan">
  20. <input class="md-toggle" data-md-toggle="drawer" type="checkbox" id="__drawer" autocomplete="off">
  21. <input class="md-toggle" data-md-toggle="search" type="checkbox" id="__search" autocomplete="off">
  22. <label class="md-overlay" for="__drawer"></label>
  23. <div data-md-component="skip">
  24. <a href="#get-started-with-doccano" class="md-skip">
  25. Skip to content
  26. </a>
  27. </div>
  28. <div data-md-component="announce">
  29. </div>
  30. <header class="md-header" data-md-component="header">
  31. <nav class="md-header-nav md-grid" aria-label="Header">
  32. <a href="https://doccano.github.io/doccano/" title="doccano" class="md-header-nav__button md-logo" aria-label="doccano">
  33. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 8a3 3 0 003-3 3 3 0 00-3-3 3 3 0 00-3 3 3 3 0 003 3m0 3.54C9.64 9.35 6.5 8 3 8v11c3.5 0 6.64 1.35 9 3.54 2.36-2.19 5.5-3.54 9-3.54V8c-3.5 0-6.64 1.35-9 3.54z"/></svg>
  34. </a>
  35. <label class="md-header-nav__button md-icon" for="__drawer">
  36. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M3 6h18v2H3V6m0 5h18v2H3v-2m0 5h18v2H3v-2z"/></svg>
  37. </label>
  38. <div class="md-header-nav__title" data-md-component="header-title">
  39. <div class="md-header-nav__ellipsis">
  40. <span class="md-header-nav__topic md-ellipsis">
  41. doccano
  42. </span>
  43. <span class="md-header-nav__topic md-ellipsis">
  44. Get started
  45. </span>
  46. </div>
  47. </div>
  48. <div class="md-header-nav__source">
  49. <a href="https://github.com/doccano/doccano/" title="Go to repository" class="md-source">
  50. <div class="md-source__icon md-icon">
  51. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512"><path d="M439.55 236.05L244 40.45a28.87 28.87 0 00-40.81 0l-40.66 40.63 51.52 51.52c27.06-9.14 52.68 16.77 43.39 43.68l49.66 49.66c34.23-11.8 61.18 31 35.47 56.69-26.49 26.49-70.21-2.87-56-37.34L240.22 199v121.85c25.3 12.54 22.26 41.85 9.08 55a34.34 34.34 0 01-48.55 0c-17.57-17.6-11.07-46.91 11.25-56v-123c-20.8-8.51-24.6-30.74-18.64-45L142.57 101 8.45 235.14a28.86 28.86 0 000 40.81l195.61 195.6a28.86 28.86 0 0040.8 0l194.69-194.69a28.86 28.86 0 000-40.81z"/></svg>
  52. </div>
  53. <div class="md-source__repository">
  54. doccano/doccano
  55. </div>
  56. </a>
  57. </div>
  58. </nav>
  59. </header>
  60. <div class="md-container" data-md-component="container">
  61. <main class="md-main" data-md-component="main">
  62. <div class="md-main__inner md-grid">
  63. <div class="md-sidebar md-sidebar--primary" data-md-component="navigation">
  64. <div class="md-sidebar__scrollwrap">
  65. <div class="md-sidebar__inner">
  66. <nav class="md-nav md-nav--primary" aria-label="Navigation" data-md-level="0">
  67. <label class="md-nav__title" for="__drawer">
  68. <a href="https://doccano.github.io/doccano/" title="doccano" class="md-nav__button md-logo" aria-label="doccano">
  69. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 8a3 3 0 003-3 3 3 0 00-3-3 3 3 0 00-3 3 3 3 0 003 3m0 3.54C9.64 9.35 6.5 8 3 8v11c3.5 0 6.64 1.35 9 3.54 2.36-2.19 5.5-3.54 9-3.54V8c-3.5 0-6.64 1.35-9 3.54z"/></svg>
  70. </a>
  71. doccano
  72. </label>
  73. <div class="md-nav__source">
  74. <a href="https://github.com/doccano/doccano/" title="Go to repository" class="md-source">
  75. <div class="md-source__icon md-icon">
  76. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512"><path d="M439.55 236.05L244 40.45a28.87 28.87 0 00-40.81 0l-40.66 40.63 51.52 51.52c27.06-9.14 52.68 16.77 43.39 43.68l49.66 49.66c34.23-11.8 61.18 31 35.47 56.69-26.49 26.49-70.21-2.87-56-37.34L240.22 199v121.85c25.3 12.54 22.26 41.85 9.08 55a34.34 34.34 0 01-48.55 0c-17.57-17.6-11.07-46.91 11.25-56v-123c-20.8-8.51-24.6-30.74-18.64-45L142.57 101 8.45 235.14a28.86 28.86 0 000 40.81l195.61 195.6a28.86 28.86 0 0040.8 0l194.69-194.69a28.86 28.86 0 000-40.81z"/></svg>
  77. </div>
  78. <div class="md-source__repository">
  79. doccano/doccano
  80. </div>
  81. </a>
  82. </div>
  83. <ul class="md-nav__list" data-md-scrollfix>
  84. <li class="md-nav__item md-nav__item--active">
  85. <input class="md-nav__toggle md-toggle" data-md-toggle="toc" type="checkbox" id="__toc">
  86. <label class="md-nav__link md-nav__link--active" for="__toc">
  87. Get started
  88. <span class="md-nav__icon md-icon"></span>
  89. </label>
  90. <a href="." class="md-nav__link md-nav__link--active">
  91. Get started
  92. </a>
  93. <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
  94. <label class="md-nav__title" for="__toc">
  95. <span class="md-nav__icon md-icon"></span>
  96. Table of contents
  97. </label>
  98. <ul class="md-nav__list" data-md-scrollfix>
  99. <li class="md-nav__item">
  100. <a href="#what-is-doccano" class="md-nav__link">
  101. What is doccano?
  102. </a>
  103. </li>
  104. <li class="md-nav__item">
  105. <a href="#doccano-labeling-workflow" class="md-nav__link">
  106. Doccano labeling workflow
  107. </a>
  108. </li>
  109. <li class="md-nav__item">
  110. <a href="#quickstart" class="md-nav__link">
  111. Quickstart
  112. </a>
  113. </li>
  114. <li class="md-nav__item">
  115. <a href="#architecture" class="md-nav__link">
  116. Architecture
  117. </a>
  118. </li>
  119. <li class="md-nav__item">
  120. <a href="#contact" class="md-nav__link">
  121. Contact
  122. </a>
  123. </li>
  124. </ul>
  125. </nav>
  126. </li>
  127. <li class="md-nav__item">
  128. <a href="install_and_upgrade_doccano/" class="md-nav__link">
  129. Install and upgrade doccano
  130. </a>
  131. </li>
  132. <li class="md-nav__item">
  133. <a href="tutorial/" class="md-nav__link">
  134. Tutorial
  135. </a>
  136. </li>
  137. <li class="md-nav__item">
  138. <a href="setup_cloud_storage/" class="md-nav__link">
  139. Setup cloud storage
  140. </a>
  141. </li>
  142. <li class="md-nav__item md-nav__item--nested">
  143. <input class="md-nav__toggle md-toggle" data-md-toggle="nav-5" type="checkbox" id="nav-5">
  144. <label class="md-nav__link" for="nav-5">
  145. Advanced
  146. <span class="md-nav__icon md-icon"></span>
  147. </label>
  148. <nav class="md-nav" aria-label="Advanced" data-md-level="1">
  149. <label class="md-nav__title" for="nav-5">
  150. <span class="md-nav__icon md-icon"></span>
  151. Advanced
  152. </label>
  153. <ul class="md-nav__list" data-md-scrollfix>
  154. <li class="md-nav__item">
  155. <a href="advanced/aws_https_settings/" class="md-nav__link">
  156. AWS HTTPS settings
  157. </a>
  158. </li>
  159. <li class="md-nav__item">
  160. <a href="advanced/oauth2_settings/" class="md-nav__link">
  161. OAuth2 settings
  162. </a>
  163. </li>
  164. <li class="md-nav__item">
  165. <a href="advanced/auto_labelling_config/" class="md-nav__link">
  166. Auto labeling settings
  167. </a>
  168. </li>
  169. </ul>
  170. </nav>
  171. </li>
  172. <li class="md-nav__item">
  173. <a href="developer_guide/" class="md-nav__link">
  174. Developer guide
  175. </a>
  176. </li>
  177. <li class="md-nav__item">
  178. <a href="faq/" class="md-nav__link">
  179. FAQ
  180. </a>
  181. </li>
  182. <li class="md-nav__item">
  183. <a href="CODE_OF_CONDUCT/" class="md-nav__link">
  184. Code of conduct
  185. </a>
  186. </li>
  187. <li class="md-nav__item">
  188. <a href="roadmap/" class="md-nav__link">
  189. Roadmap
  190. </a>
  191. </li>
  192. </ul>
  193. </nav>
  194. </div>
  195. </div>
  196. </div>
  197. <div class="md-sidebar md-sidebar--secondary" data-md-component="toc">
  198. <div class="md-sidebar__scrollwrap">
  199. <div class="md-sidebar__inner">
  200. <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
  201. <label class="md-nav__title" for="__toc">
  202. <span class="md-nav__icon md-icon"></span>
  203. Table of contents
  204. </label>
  205. <ul class="md-nav__list" data-md-scrollfix>
  206. <li class="md-nav__item">
  207. <a href="#what-is-doccano" class="md-nav__link">
  208. What is doccano?
  209. </a>
  210. </li>
  211. <li class="md-nav__item">
  212. <a href="#doccano-labeling-workflow" class="md-nav__link">
  213. Doccano labeling workflow
  214. </a>
  215. </li>
  216. <li class="md-nav__item">
  217. <a href="#quickstart" class="md-nav__link">
  218. Quickstart
  219. </a>
  220. </li>
  221. <li class="md-nav__item">
  222. <a href="#architecture" class="md-nav__link">
  223. Architecture
  224. </a>
  225. </li>
  226. <li class="md-nav__item">
  227. <a href="#contact" class="md-nav__link">
  228. Contact
  229. </a>
  230. </li>
  231. </ul>
  232. </nav>
  233. </div>
  234. </div>
  235. </div>
  236. <div class="md-content">
  237. <article class="md-content__inner md-typeset">
  238. <a href="https://github.com/doccano/doccano/edit/master/docs/index.md" title="Edit this page" class="md-content__button md-icon" aria-label="Edit this page"> <!-- icon-only link: aria-label supplies the accessible name, the SVG is decorative -->
  239. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24" aria-hidden="true"><path d="M20.71 7.04c.39-.39.39-1.04 0-1.41l-2.34-2.34c-.37-.39-1.02-.39-1.41 0l-1.84 1.83 3.75 3.75M3 17.25V21h3.75L17.81 9.93l-3.75-3.75L3 17.25z"/></svg>
  240. </a>
  241. <h1 id="get-started-with-doccano">Get started with doccano</h1>
  242. <h2 id="what-is-doccano">What is doccano?</h2> <!-- Intro section: product summary, link to the hosted demo, demo image -->
  243. <p><strong>doccano</strong> is an open-source data labeling tool for machine learning practitioners. You can use doccano to perform different types of labeling tasks with many data formats. To see what doccano can do, try the <a href="https://doccano.herokuapp.com">doccano demo</a>.</p>
  244. <p><img alt="doccano demo" src="https://raw.githubusercontent.com/doccano/doccano/master/docs/images/demo/demo.gif"></p>
  245. <p>You can also integrate doccano with your script via the doccano REST APIs. By using the doccano APIs, you can label your data by using some machine learning model.</p>
  246. <h2 id="doccano-labeling-workflow">Doccano labeling workflow</h2>
  247. <p>To complete a labeling project with doccano:</p>
  248. <ol>
  249. <li>Install doccano.</li>
  250. <li>Run doccano.</li>
  251. <li>Set up the labeling project. Select the type of labeling project and configure project settings.</li>
  252. <li>Import your dataset. You can also import labeled datasets.</li>
  253. <li>Add users to the project.</li>
  254. <li>Define the annotation guideline.</li>
  255. <li>Start labeling the data.</li>
  256. <li>Export the labeled dataset.</li>
  257. </ol>
  258. <h2 id="quickstart">Quickstart</h2>
  259. <ol>
  260. <li> <!-- Step 1: install from PyPI; the command is a preformatted block so it can be copied verbatim -->
  261. <p>Install doccano with pip (Python 3.8+):</p>
  262. <pre><code>pip install doccano
  263. </code></pre>
  264. </li>
  265. <li> <!-- Step 2: initialise, create a user, start the web server, then start the task runner in a second terminal -->
  266. <p>Run doccano:</p>
  267. <pre><code>doccano init
  268. doccano createuser
  269. doccano webserver
  270. # In another terminal, run the command:
  271. doccano task
  272. </code></pre>
  273. </li>
  274. <li>
  275. <p>Open the doccano UI at <a href="http://localhost:8000/auth">http://localhost:8000/auth</a>.</p>
  276. </li>
  277. <li>
  278. <p>Sign in with the username and password created by <code>doccano createuser</code>.</p>
  279. <p>The default is <strong>username:</strong> admin, <strong>password:</strong> password.</p>
  280. </li>
  281. <li>
  282. <p>Change the default admin password at <a href="http://localhost:8000/admin/password_change/">http://localhost:8000/admin/password_change/</a>.</p>
  283. </li>
  284. <li>Return to the doccano UI at <a href="http://localhost:8000/projects">http://localhost:8000/projects</a>.</li>
  285. <li>Create a project for labeling data. Click <strong>Create</strong>, select a project type, and fill out project details.</li>
  286. <li>Import a dataset. Go to the <strong>Dataset</strong> page and click <strong>Actions</strong> &gt; <strong>Import Dataset</strong> and import the dataset you want to use.</li>
  287. <li>Click <strong>Annotate</strong> and label the data.</li>
  288. <li>When you're finished, export the labeled dataset. Go to the <strong>Dataset</strong> page and click <strong>Actions</strong> &gt; <strong>Export dataset</strong>.</li>
  289. </ol>
  290. <h2 id="architecture">Architecture</h2>
  291. <p>You can customize doccano to suit your needs. The architecture of doccano consists of two parts: backend and frontend.</p>
  292. <table> <!-- Architecture overview: one row per doccano module; header cells are scoped to their columns -->
  293. <thead>
  294. <tr>
  295. <th scope="col">Module</th>
  296. <th scope="col">Technology</th>
  297. <th scope="col">Description</th>
  298. </tr>
  299. </thead>
  300. <tbody>
  301. <tr>
  302. <td><a href="https://github.com/doccano/doccano/tree/master/backend">doccano backend</a></td>
  303. <td>Python, <a href="https://www.djangoproject.com/">Django</a>, and <a href="https://www.django-rest-framework.org/">Django REST framework</a></td>
  304. <td>Perform data labeling via REST APIs.</td>
  305. </tr>
  306. <tr>
  307. <td><a href="https://github.com/doccano/doccano/tree/master/frontend">doccano frontend</a></td>
  308. <td>JavaScript web app using <a href="https://vuejs.org/">Vue.js</a> and <a href="https://nuxtjs.org/">Nuxt.js</a></td>
  309. <td>Perform data labeling in a user interface.</td>
  310. </tr>
  311. </tbody>
  312. </table>
  313. <h2 id="contact">Contact</h2>
  314. <p>If you get stuck, check the <a href="faq/">FAQ</a>.</p>
  315. <p>For help and feedback, feel free to contact <a href="https://github.com/Hironsan">the author</a>.</p>
  316. </article>
  317. </div>
  318. </div>
  319. </main>
  320. <footer class="md-footer">
  321. <div class="md-footer-nav">
  322. <nav class="md-footer-nav__inner md-grid" aria-label="Footer">
  323. <a href="install_and_upgrade_doccano/" class="md-footer-nav__link md-footer-nav__link--next" rel="next">
  324. <div class="md-footer-nav__title">
  325. <div class="md-ellipsis">
  326. <span class="md-footer-nav__direction">
  327. Next
  328. </span>
  329. Install and upgrade doccano
  330. </div>
  331. </div>
  332. <div class="md-footer-nav__button md-icon">
  333. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M4 11v2h12l-5.5 5.5 1.42 1.42L19.84 12l-7.92-7.92L10.5 5.5 16 11H4z"/></svg>
  334. </div>
  335. </a>
  336. </nav>
  337. </div>
  338. <div class="md-footer-meta md-typeset">
  339. <div class="md-footer-meta__inner md-grid">
  340. <div class="md-footer-copyright">
  341. <div class="md-footer-copyright__highlight">
  342. Copyright &copy; 2018 - 2019 Hiroki Nakayama
  343. </div>
  344. Made with
  345. <a href="https://squidfunk.github.io/mkdocs-material/" target="_blank" rel="noopener">
  346. Material for MkDocs
  347. </a>
  348. </div>
  349. <div class="md-footer-social">
  350. <a href="https://github.com/Hironsan" target="_blank" rel="noopener" title="github.com" class="md-footer-social__link">
  351. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 496 512"><path d="M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6zm-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3zm44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9zM244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8zM97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1zm-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7zm32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1zm-11.4-14.7c-1.6 1-1.6 3.6 0 5.9 1.6 2.3 4.3 3.3 5.6 2.3 1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2z"/></svg>
  352. </a>
  353. <a href="https://twitter.com/Hironsan13" target="_blank" rel="noopener" title="twitter.com" class="md-footer-social__link">
  354. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512"><path d="M459.37 151.716c.325 4.548.325 9.097.325 13.645 0 138.72-105.583 298.558-298.558 298.558-59.452 0-114.68-17.219-161.137-47.106 8.447.974 16.568 1.299 25.34 1.299 49.055 0 94.213-16.568 130.274-44.832-46.132-.975-84.792-31.188-98.112-72.772 6.498.974 12.995 1.624 19.818 1.624 9.421 0 18.843-1.3 27.614-3.573-48.081-9.747-84.143-51.98-84.143-102.985v-1.299c13.969 7.797 30.214 12.67 47.431 13.319-28.264-18.843-46.781-51.005-46.781-87.391 0-19.492 5.197-37.36 14.294-52.954 51.655 63.675 129.3 105.258 216.365 109.807-1.624-7.797-2.599-15.918-2.599-24.04 0-57.828 46.782-104.934 104.934-104.934 30.213 0 57.502 12.67 76.67 33.137 23.715-4.548 46.456-13.32 66.599-25.34-7.798 24.366-24.366 44.833-46.132 57.827 21.117-2.273 41.584-8.122 60.426-16.243-14.292 20.791-32.161 39.308-52.628 54.253z"/></svg>
  355. </a>
  356. </div>
  357. </div>
  358. </div>
  359. </footer>
  360. </div>
  361. <script src="assets/javascripts/vendor.6a3d08fc.min.js"></script>
  362. <script src="assets/javascripts/bundle.71201edf.min.js"></script><script id="__lang" type="application/json">{"clipboard.copy": "Copy to clipboard", "clipboard.copied": "Copied to clipboard", "search.config.lang": "en", "search.config.pipeline": "trimmer, stopWordFilter", "search.config.separator": "[\\s\\-]+", "search.placeholder": "Search", "search.result.placeholder": "Type to start searching", "search.result.none": "No matching documents", "search.result.one": "1 matching document", "search.result.other": "# matching documents", "search.result.more.one": "1 more on this page", "search.result.more.other": "# more on this page", "search.result.term.missing": "Missing"}</script>
  363. <script>
  364. app = initialize({ // no var/let/const: `app` becomes an implicit global; `initialize` is not defined in this file (presumably provided by the bundle script loaded above; confirm)
  365. base: ".",
  366. features: [],
  367. search: Object.assign({ // default search settings, merged with an optional override object
  368. worker: "assets/javascripts/worker/search.4ac00218.min.js"
  369. }, typeof search !== "undefined" && search) // evaluates to `false` when no global `search` exists, which Object.assign ignores
  370. })
  371. </script>
  372. </body>
  373. </html>