You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

157 lines
5.9 KiB

import json
import botocore.exceptions
import requests
from auto_labeling_pipeline.mappings import MappingTemplate
from auto_labeling_pipeline.menu import Options
from auto_labeling_pipeline.models import RequestModelFactory
from auto_labeling_pipeline.postprocessing import PostProcessor
from django.shortcuts import get_object_or_404
from django_drf_filepond.models import TemporaryUpload
from rest_framework import generics, status
from rest_framework.exceptions import ValidationError
from rest_framework.permissions import IsAuthenticated
from rest_framework.request import Request
from rest_framework.response import Response
from rest_framework.views import APIView
from api.models import Project
from members.permissions import IsInProjectOrAdmin, IsProjectAdmin
from .pipeline.execution import execute_pipeline, get_label_collection
from .exceptions import AWSTokenError, SampleDataException, TemplateMappingError, URLConnectionError
from .models import AutoLabelingConfig
from .serializers import AutoLabelingConfigSerializer
class TemplateListAPI(APIView):
permission_classes = [IsAuthenticated & IsProjectAdmin]
def get(self, request: Request, *args, **kwargs):
task_name = request.query_params.get('task_name')
options = Options.filter_by_task(task_name=task_name)
option_names = [o.name for o in options]
return Response(option_names, status=status.HTTP_200_OK)
class TemplateDetailAPI(APIView):
permission_classes = [IsAuthenticated & IsProjectAdmin]
def get(self, request, *args, **kwargs):
option = Options.find(option_name=self.kwargs['option_name'])
return Response(option.to_dict(), status=status.HTTP_200_OK)
class ConfigList(generics.ListCreateAPIView):
serializer_class = AutoLabelingConfigSerializer
pagination_class = None
permission_classes = [IsAuthenticated & IsProjectAdmin]
def get_queryset(self):
return AutoLabelingConfig.objects.filter(project=self.kwargs['project_id'])
def perform_create(self, serializer):
serializer.save(project_id=self.kwargs['project_id'])
class ConfigDetail(generics.RetrieveUpdateDestroyAPIView):
queryset = AutoLabelingConfig.objects.all()
serializer_class = AutoLabelingConfigSerializer
lookup_url_kwarg = 'config_id'
permission_classes = [IsAuthenticated & IsProjectAdmin]
class RestAPIRequestTesting(APIView):
permission_classes = [IsAuthenticated & IsProjectAdmin]
@property
def project(self):
return get_object_or_404(Project, pk=self.kwargs['project_id'])
def create_model(self):
model_name = self.request.data['model_name']
model_attrs = self.request.data['model_attrs']
try:
model = RequestModelFactory.create(model_name, model_attrs)
return model
except Exception:
model = RequestModelFactory.find(model_name)
schema = model.schema()
required_fields = ', '.join(schema['required']) if 'required' in schema else ''
raise ValidationError(
'The attributes does not match the model.'
'You need to correctly specify the required fields: {}'.format(required_fields)
)
def send_request(self, model, example):
try:
return model.send(example)
except requests.exceptions.ConnectionError:
raise URLConnectionError
except botocore.exceptions.ClientError:
raise AWSTokenError()
except Exception as e:
raise e
def prepare_example(self):
text = self.request.data['text']
if self.project.is_text_project:
return text
else:
tu = TemporaryUpload.objects.get(upload_id=text)
return tu.get_file_path()
def post(self, *args, **kwargs):
model = self.create_model()
example = self.prepare_example()
response = self.send_request(model=model, example=example)
return Response(response, status=status.HTTP_200_OK)
class LabelExtractorTesting(APIView):
permission_classes = [IsAuthenticated & IsProjectAdmin]
def post(self, *args, **kwargs):
response = self.request.data['response']
template = self.request.data['template']
task_type = self.request.data['task_type']
label_collection = get_label_collection(task_type)
template = MappingTemplate(
label_collection=label_collection,
template=template
)
try:
labels = template.render(response)
except json.decoder.JSONDecodeError:
raise TemplateMappingError()
if not labels.dict():
raise SampleDataException()
return Response(labels.dict(), status=status.HTTP_200_OK)
class LabelMapperTesting(APIView):
permission_classes = [IsAuthenticated & IsProjectAdmin]
def post(self, *args, **kwargs):
response = self.request.data['response']
task_type = self.request.data['task_type']
label_mapping = self.request.data['label_mapping']
label_collection = get_label_collection(task_type)
labels = label_collection(response)
post_processor = PostProcessor(label_mapping)
labels = post_processor.transform(labels)
return Response(labels.dict(), status=status.HTTP_200_OK)
class AutomatedLabeling(generics.CreateAPIView):
permission_classes = [IsAuthenticated & IsInProjectOrAdmin]
swagger_schema = None
def create(self, request, *args, **kwargs):
project = get_object_or_404(Project, pk=self.kwargs['project_id'])
example = project.examples.get(pk=self.request.query_params['example'])
configs = AutoLabelingConfig.objects.filter(project=project)
# Todo: make async calls or celery tasks to reduce waiting time.
for config in configs:
labels = execute_pipeline(example.data, config=config)
labels.save(project, example, self.request.user)
return Response({'ok': True}, status=status.HTTP_201_CREATED)