You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
 
 
 
 
 
 

83 lines
2.7 KiB

from django.db.models import Count, Manager
class LabelManager(Manager):
    """Base manager shared by the label managers in this module.

    Provides the per-user label distribution query and the helpers used to
    decide whether a new label may be added. Subclasses must implement
    ``can_annotate``.
    """

    # Name of the relation whose ``text`` column is used to group and count
    # labels in ``calc_label_distribution`` (looked up as "<field>__text").
    label_type_field = "label"

    def calc_label_distribution(self, examples, members, labels):
        """Calculate label distribution.

        Args:
            examples: example queryset.
            members: user queryset.
            labels: label queryset.

        Returns:
            label distribution per user. Every member in ``members`` maps to a
            dict holding one entry per label in ``labels`` (0 when unused).
            Aggregated rows whose user is not in ``members`` or whose label
            text is not in ``labels`` are ignored instead of raising
            ``KeyError``.

        Examples:
            >>> self.calc_label_distribution(examples, members, labels)
            {'admin': {'positive': 10, 'negative': 5}}
        """
        distribution = {member.username: {label.text: 0 for label in labels} for member in members}
        text_key = f"{self.label_type_field}__text"
        items = (
            self.filter(example_id__in=examples)
            .values("user__username", text_key)
            .annotate(count=Count(text_key))
        )
        for item in items:
            per_user = distribution.get(item["user__username"])
            label_text = item[text_key]
            # Stored annotations can outlive the member/label sets passed in
            # (e.g. an annotator who is no longer listed in ``members``); keep
            # the result restricted to the requested grid rather than crashing.
            if per_user is None or label_text not in per_user:
                continue
            per_user[label_text] = item["count"]
        return distribution

    def get_labels(self, label, project):
        """Return the stored labels attached to the same example as ``label``.

        When ``project.collaborative_annotation`` is truthy, labels from every
        user are returned; otherwise only those created by ``label.user``.
        """
        if project.collaborative_annotation:
            return self.filter(example=label.example)
        return self.filter(example=label.example, user=label.user)

    def can_annotate(self, label, project) -> bool:
        """Tell whether ``label`` may be added under ``project``'s settings.

        Raises:
            NotImplementedError: always; subclasses provide the actual rule.
        """
        raise NotImplementedError("Please implement this method in the subclass")

    def filter_annotatable_labels(self, labels, project):
        """Return the list of ``labels`` for which ``can_annotate`` is true."""
        return [label for label in labels if self.can_annotate(label, project)]
class CategoryManager(LabelManager):
    """Manager that applies the category rule for accepting a new label."""

    def can_annotate(self, label, project) -> bool:
        """Tell whether ``label`` may be added to its example.

        If ``project.single_class_classification`` is truthy, any label
        already returned by ``get_labels`` blocks the new one. Otherwise only
        an existing entry with the same ``label.label`` blocks it.
        """
        exclusive = project.single_class_classification
        existing = self.get_labels(label, project)
        if not exclusive:
            # Multi-class mode: only an identical category counts as a conflict.
            existing = existing.filter(label=label.label)
        return not existing.exists()
class SpanManager(LabelManager):
    """Manager that applies the span rule for accepting a new label."""

    def can_annotate(self, label, project) -> bool:
        """Tell whether ``label`` may be added to its example.

        Always true when ``project.allow_overlapping`` is truthy (a missing
        attribute is treated as ``False``). Otherwise true only if no label
        returned by ``get_labels`` reports ``is_overlapping(label)``.
        """
        allow_overlap = getattr(project, "allow_overlapping", False)
        existing = self.get_labels(label, project)
        if allow_overlap:
            return True
        # ``any`` stops at the first conflicting span, like an early return.
        return not any(span.is_overlapping(label) for span in existing)
class TextLabelManager(LabelManager):
    """Manager that applies the text-label rule for accepting a new label."""

    def can_annotate(self, label, project) -> bool:
        """Tell whether ``label`` may be added to its example.

        True only if no label returned by ``get_labels`` reports
        ``is_same_text(label)``.
        """
        existing = self.get_labels(label, project)
        # Short-circuits on the first stored label reporting the same text.
        return not any(text.is_same_text(label) for text in existing)
class RelationManager(LabelManager):
    """Manager for relations; distribution is grouped by ``type__text``."""

    # Overrides the base-class default so the distribution query reads
    # "type__text" instead of "label__text".
    label_type_field = "type"

    def can_annotate(self, label, project) -> bool:
        """Always allow the annotation; no check is performed."""
        return True