mirror of https://github.com/doccano/doccano.git
pythonannotation-tooldatasetsactive-learningtext-annotationdatasetnatural-language-processingdata-labelingmachine-learning
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
118 lines
2.9 KiB
118 lines
2.9 KiB
from typing import Any, Dict, Protocol, Tuple
|
|
|
|
from django.db import models
|
|
|
|
from examples.models import Comment, Example
|
|
from labels.models import BoundingBox, Category, Relation, Segmentation, Span, TextLabel
|
|
from projects.models import Project
|
|
|
|
DATA = "data"
|
|
|
|
|
|
class ExportedExampleManager(models.Manager):
|
|
def confirmed(self, project: Project, user=None):
|
|
if project.collaborative_annotation:
|
|
return self.filter(project=project).exclude(states=None)
|
|
else:
|
|
assert user is not None
|
|
return self.filter(project=project, states__confirmed_by=user)
|
|
|
|
|
|
class ExportedExample(Example):
|
|
objects = ExportedExampleManager()
|
|
|
|
def to_dict(self, is_text_project=True) -> Dict[str, Any]:
|
|
return {"id": self.id, DATA: self.text if is_text_project else self.upload_name, **self.meta}
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedLabel(Protocol):
|
|
objects: models.Manager
|
|
|
|
def to_dict(self) -> Dict[str, Any]:
|
|
raise NotImplementedError("Please implement this method in the subclass.")
|
|
|
|
def to_string(self) -> str:
|
|
raise NotImplementedError("Please implement this method in the subclass.")
|
|
|
|
def to_tuple(self) -> Tuple:
|
|
raise NotImplementedError("Please implement this method in the subclass.")
|
|
|
|
|
|
class ExportedCategory(Category):
|
|
def to_string(self) -> str:
|
|
return self.label.text
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedSpan(Span):
|
|
def to_dict(self):
|
|
return {
|
|
"id": self.id,
|
|
"label": self.label.text,
|
|
"start_offset": self.start_offset,
|
|
"end_offset": self.end_offset,
|
|
}
|
|
|
|
def to_tuple(self):
|
|
return self.start_offset, self.end_offset, self.label.text
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedRelation(Relation):
|
|
def to_dict(self):
|
|
return {"id": self.id, "from_id": self.from_id.id, "to_id": self.to_id.id, "type": self.type.text}
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedText(TextLabel):
|
|
def to_string(self) -> str:
|
|
return self.text
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedComment(Comment):
|
|
def to_string(self) -> str:
|
|
return self.text
|
|
|
|
def to_dict(self):
|
|
return {"id": self.id, "comment": self.text}
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedBoundingBox(BoundingBox):
|
|
def to_dict(self):
|
|
return {
|
|
"uuid": str(self.uuid),
|
|
"x": self.x,
|
|
"y": self.y,
|
|
"width": self.width,
|
|
"height": self.height,
|
|
"label": self.label.text,
|
|
}
|
|
|
|
def to_tuple(self):
|
|
return self.x, self.y, self.width, self.height
|
|
|
|
class Meta:
|
|
proxy = True
|
|
|
|
|
|
class ExportedSegmentation(Segmentation):
|
|
def to_dict(self):
|
|
return {"uuid": str(self.uuid), "points": self.points, "label": self.label.text}
|
|
|
|
class Meta:
|
|
proxy = True
|