You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

128 lines
4.9 KiB

import uuid
from django.contrib.auth.models import User
from django.core.exceptions import ValidationError
from django.db import models
from .managers import (
CategoryManager,
LabelManager,
RelationManager,
SpanManager,
TextLabelManager,
)
from examples.models import Example
from label_types.models import CategoryType, RelationType, SpanType
class Label(models.Model):
    """Abstract base model with the fields shared by every label type.

    The model is declared abstract, so it has no table of its own; each
    concrete subclass gets these columns in addition to its own fields.
    """

    # Default manager for label querysets.
    objects = LabelManager()

    # Unique identifier, generated with ``uuid.uuid4`` unless supplied.
    uuid = models.UUIDField(unique=True, default=uuid.uuid4)
    # Float defaulting to 0.0 (presumably a model confidence -- confirm).
    prob = models.FloatField(default=0.0)
    # Boolean defaulting to False (presumably "created by hand" -- confirm).
    manual = models.BooleanField(default=False)
    # Owner of the label; the label is deleted together with the user.
    user = models.ForeignKey(to=User, on_delete=models.CASCADE)
    # Set once on insert / refreshed on every save, respectively.
    created_at = models.DateTimeField(auto_now_add=True)
    updated_at = models.DateTimeField(auto_now=True)

    class Meta:
        abstract = True
class Category(Label):
    """Label that assigns a ``CategoryType`` to an example.

    The same user cannot attach the same category type to the same example
    more than once (see ``unique_together``).
    """

    objects = CategoryManager()

    # Annotated example; reachable from the example as ``example.categories``.
    example = models.ForeignKey(
        to=Example,
        on_delete=models.CASCADE,
        related_name="categories",
    )
    # The category type being assigned.
    label = models.ForeignKey(
        to=CategoryType,
        on_delete=models.CASCADE,
    )

    class Meta:
        unique_together = ("example", "user", "label")
class Span(Label):
    """Label covering the character range ``[start_offset, end_offset)`` of an example.

    The offsets are used as Python slice bounds on ``example.text``, so the
    start is inclusive and the end is exclusive. Every ``save()`` runs
    ``full_clean()`` first, which in turn enforces the project's overlap
    policy through ``validate_unique()``.
    """

    objects = SpanManager()

    # Annotated example; reachable from the example as ``example.spans``.
    example = models.ForeignKey(to=Example, on_delete=models.CASCADE, related_name="spans")
    # The span type being assigned.
    label = models.ForeignKey(to=SpanType, on_delete=models.CASCADE)
    start_offset = models.IntegerField()
    end_offset = models.IntegerField()

    class Meta:
        # Database-level guards: offsets are non-negative and the span is non-empty.
        # The constraint names are kept verbatim because they are part of the
        # schema recorded by migrations.
        constraints = [
            models.CheckConstraint(check=models.Q(start_offset__gte=0), name="startOffset >= 0"),
            models.CheckConstraint(check=models.Q(end_offset__gte=0), name="endOffset >= 0"),
            models.CheckConstraint(check=models.Q(start_offset__lt=models.F("end_offset")), name="start < end"),
        ]

    def __str__(self):
        """Return ``(covered text, start_offset, end_offset, label text)`` as a string."""
        text = self.example.text[self.start_offset : self.end_offset]
        return f"({text}, {self.start_offset}, {self.end_offset}, {self.label.text})"

    def validate_unique(self, exclude=None):
        """Run the inherited uniqueness checks, then enforce the overlap policy.

        If the example's project has a truthy ``allow_overlapping`` attribute,
        only the inherited checks run. Otherwise the span must not overlap any
        other span on the same example: any user's spans when the project has
        ``collaborative_annotation`` set, only this user's spans when it does not.

        Args:
            exclude: Field names to skip, forwarded to the inherited check.

        Raises:
            ValidationError: If an inherited uniqueness check fails or a
                forbidden overlap exists.
        """
        # Run the inherited checks (e.g. the unique ``uuid``) on every path,
        # not only when overlapping is allowed.
        super().validate_unique(exclude=exclude)

        project = self.example.project
        if getattr(project, "allow_overlapping", False):
            return

        # Another span overlaps this one if it starts inside it, ends inside
        # it, or fully contains it.
        overlapping_spans = (
            Span.objects.exclude(id=self.id)
            .filter(example=self.example)
            .filter(
                models.Q(start_offset__gte=self.start_offset, start_offset__lt=self.end_offset)
                | models.Q(end_offset__gt=self.start_offset, end_offset__lte=self.end_offset)
                | models.Q(start_offset__lte=self.start_offset, end_offset__gte=self.end_offset)
            )
        )
        # Without collaborative annotation, only the same user's spans conflict.
        if not project.collaborative_annotation:
            overlapping_spans = overlapping_spans.filter(user=self.user)
        if overlapping_spans.exists():
            raise ValidationError("This overlapping is not allowed in this project.")

    def save(self, force_insert=False, force_update=False, using=None, update_fields=None):
        """Validate the instance with ``full_clean()`` and then persist it.

        Raises:
            ValidationError: If ``full_clean()`` rejects the instance.
        """
        self.full_clean()
        # Forward by keyword: positional arguments to Model.save() are
        # deprecated in recent Django releases.
        super().save(
            force_insert=force_insert,
            force_update=force_update,
            using=using,
            update_fields=update_fields,
        )

    def is_overlapping(self, other: "Span") -> bool:
        """Return True if this span shares at least one position with ``other``.

        Compares offsets only; it does not check that both spans belong to
        the same example.
        """
        return (
            # This span starts inside the other one.
            (other.start_offset <= self.start_offset < other.end_offset)
            # This span ends inside the other one.
            or (other.start_offset < self.end_offset <= other.end_offset)
            # This span strictly contains the other one.
            or (self.start_offset < other.start_offset and other.end_offset < self.end_offset)
        )
class TextLabel(Label):
    """Free-text label attached to an example.

    The same user cannot store the same text twice on the same example
    (see ``unique_together``).
    """

    objects = TextLabelManager()

    # Annotated example; reachable from the example as ``example.texts``.
    example = models.ForeignKey(
        to=Example,
        on_delete=models.CASCADE,
        related_name="texts",
    )
    # The label content itself.
    text = models.TextField()

    class Meta:
        unique_together = ("example", "user", "text")

    def is_same_text(self, other: "TextLabel") -> bool:
        """Return True when ``other`` carries exactly the same text as this label."""
        return self.text == other.text
class Relation(Label):
    """Typed, directed link between two spans of one example.

    Every ``save()`` runs ``full_clean()`` first, so ``clean()`` rejects a
    relation whose two spans and own ``example`` do not all refer to the
    same example.
    """

    objects = RelationManager()

    # Source and target spans; reachable from a span as
    # ``span.from_relations`` and ``span.to_relations``.
    from_id = models.ForeignKey(Span, on_delete=models.CASCADE, related_name="from_relations")
    to_id = models.ForeignKey(Span, on_delete=models.CASCADE, related_name="to_relations")
    # The relation type being assigned.
    type = models.ForeignKey(RelationType, on_delete=models.CASCADE)
    # Annotated example; reachable from the example as ``example.relations``.
    example = models.ForeignKey(to=Example, on_delete=models.CASCADE, related_name="relations")

    def __str__(self):
        """Return ``"<source text> - (<type text>) -> <target text>"``."""
        text = self.example.text
        from_span = text[self.from_id.start_offset : self.from_id.end_offset]
        to_span = text[self.to_id.start_offset : self.to_id.end_offset]
        type_text = self.type.text
        return f"{from_span} - ({type_text}) -> {to_span}"

    def save(self, force_insert=False, force_update=False, using=None, update_fields=None):
        """Validate the instance with ``full_clean()`` and then persist it.

        Raises:
            ValidationError: If ``full_clean()`` rejects the instance.
        """
        self.full_clean()
        # Forward by keyword: positional arguments to Model.save() are
        # deprecated in recent Django releases.
        super().save(
            force_insert=force_insert,
            force_update=force_update,
            using=using,
            update_fields=update_fields,
        )

    def clean(self):
        """Check that both spans and the relation refer to the same example.

        Raises:
            ValidationError: If the source span, the target span and this
                relation do not all point at the same example.
        """
        same_example = self.from_id.example == self.to_id.example == self.example
        if not same_example:
            raise ValidationError("You need to label the same example.")
        return super().clean()