doccano/backend/data_export/tests/test_task.py


								import os

								import zipfile


								import pandas as pd

								from django.test import TestCase, override_settings

								from model_mommy import mommy


								from ..celery_tasks import export_dataset

								from data_export.models import DATA

								from projects.models import ProjectType

								from projects.tests.utils import prepare_project


								def read_zip_content(file):
								    """Read a zip archive of JSON-lines members into a dict of records.

								    Args:
								        file: Path or binary file-like object accepted by ``zipfile.ZipFile``.

								    Returns:
								        dict: Maps each member's file name, minus its final extension, to
								        the list of records (one dict per JSON line) parsed from it.
								    """
								    datasets = {}
								    with zipfile.ZipFile(file) as archive:
								        for member in archive.infolist():
								            # Strip only the last extension so names that themselves contain
								            # dots (e.g. "john.doe.jsonl") are not truncated at the first dot.
								            username = os.path.splitext(member.filename)[0]
								            with archive.open(member) as handle:
								                try:
								                    frame = pd.read_json(handle, lines=True)
								                except pd.errors.EmptyDataError:
								                    # Members pandas reports as having no data are left out.
								                    continue
								            datasets[username] = frame.to_dict(orient="records")
								    return datasets


								@override_settings(MEDIA_URL=os.path.dirname(__file__))
								class TestExport(TestCase):
								    """Shared helpers for the export test cases in this module.

								    The helpers read ``self.project``, which this class never sets; the
								    subclasses visible in this module assign it in ``prepare_data``.
								    """

								    def export_dataset(self, confirmed_only=False):
								        """Run the export task as JSONL and return the parsed result.

								        Args:
								            confirmed_only: Forwarded as the third argument of the task.

								        Returns:
								            A list of records when the project is collaborative, otherwise
								            the dict produced by ``read_zip_content``.
								        """
								        # Inside a method this name resolves to the module-level task,
								        # not to this method.
								        file = export_dataset(self.project.id, "JSONL", confirmed_only)
								        try:
								            if self.project.item.collaborative_annotation:
								                return pd.read_json(file, lines=True).to_dict(orient="records")
								            return read_zip_content(file)
								        finally:
								            # Remove the exported file even when parsing fails, so a broken
								            # export does not leave artifacts behind.
								            os.remove(file)

								    def data_to_text(self, example):
								        """Return ``example.to_dict()`` with the ``DATA`` key renamed to ``"text"``."""
								        d = example.to_dict()
								        d["text"] = d.pop(DATA)
								        return d

								    def data_to_filename(self, example):
								        """Return ``example.to_dict(is_text_project=False)`` with ``DATA`` renamed to ``"filename"``."""
								        d = example.to_dict(is_text_project=False)
								        d["filename"] = d.pop(DATA)
								        return d


								class TestExportCategory(TestExport):
								    """Export checks for a ``DOCUMENT_CLASSIFICATION`` project."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; only ``example1`` gets categories, comments and a confirmation."""
								        self.project = prepare_project(ProjectType.DOCUMENT_CLASSIFICATION, collaborative_annotation=collaborative)
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="example1")
								        self.example2 = mommy.make("ExportedExample", project=item, text="example2")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.category1 = mommy.make("ExportedCategory", example=self.example1, user=admin)
								        self.category2 = mommy.make("ExportedCategory", example=self.example1, user=annotator)
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_text(self.example1), self.data_to_text(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"label": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[self.category1.to_string()], Comments=[self.comment1.to_string()]),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(self.data1, label=[self.category2.to_string()], Comments=[self.comment2.to_string()]),
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        labels = sorted([self.category1.to_string(), self.category2.to_string()])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        annotated = {**self.data1, "label": labels, "Comments": comments}
								        untouched = {**self.data2, "label": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` the admin's file holds just the confirmed example."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        admin_rows = [
								            dict(self.data1, label=[self.category1.to_string()], Comments=[self.comment1.to_string()])
								        ]
								        expected = {self.project.admin.username: admin_rows}
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        labels = sorted([self.category1.to_string(), self.category2.to_string()])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        self.assertEqual(exported, [{**self.data1, "label": labels, "Comments": comments}])


								class TestExportSeq2seq(TestExport):
								    """Export checks for a ``SEQ2SEQ`` project."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; only ``example1`` gets text labels, comments and a confirmation."""
								        self.project = prepare_project(ProjectType.SEQ2SEQ, collaborative_annotation=collaborative)
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.text1 = mommy.make("TextLabel", example=self.example1, user=admin)
								        self.text2 = mommy.make("TextLabel", example=self.example1, user=annotator)
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_text(self.example1), self.data_to_text(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"label": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[self.text1.text], Comments=[self.comment1.to_string()]),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(self.data1, label=[self.text2.text], Comments=[self.comment2.to_string()]),
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        labels = sorted([self.text1.text, self.text2.text])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        annotated = {**self.data1, "label": labels, "Comments": comments}
								        untouched = {**self.data2, "label": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` every exported file must match its expected rows."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[self.text1.text], Comments=[self.comment1.to_string()]),
								            ],
								            self.project.approver.username: [],
								            self.project.annotator.username: [],
								        }
								        # Driven by the exported files: each one is looked up in ``expected``.
								        for member, rows in exported.items():
								            self.assertEqual(rows, expected[member])

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        labels = sorted([self.text1.text, self.text2.text])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        self.assertEqual(exported, [{**self.data1, "label": labels, "Comments": comments}])


								class TestExportIntentDetectionAndSlotFilling(TestExport):
								    """Export checks for an ``INTENT_DETECTION_AND_SLOT_FILLING`` project."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; ``example1`` gets categories, comments, one admin span and a confirmation."""
								        self.project = prepare_project(
								            ProjectType.INTENT_DETECTION_AND_SLOT_FILLING, collaborative_annotation=collaborative
								        )
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.category1 = mommy.make("ExportedCategory", example=self.example1, user=admin)
								        self.category2 = mommy.make("ExportedCategory", example=self.example1, user=annotator)
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        offsets = {"start_offset": 0, "end_offset": 1}
								        self.span = mommy.make("ExportedSpan", example=self.example1, user=admin, **offsets)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_text(self.example1), self.data_to_text(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"entities": [], "cats": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(
								                    self.data1,
								                    entities=[list(self.span.to_tuple())],
								                    cats=[self.category1.to_string()],
								                    Comments=[self.comment1.to_string()],
								                ),
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(
								                    self.data1,
								                    entities=[],
								                    cats=[self.category2.to_string()],
								                    Comments=[self.comment2.to_string()],
								                ),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(rows, exported[member])

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        annotated = {
								            **self.data1,
								            "entities": [list(self.span.to_tuple())],
								            "cats": sorted([self.category1.to_string(), self.category2.to_string()]),
								            "Comments": sorted([self.comment1.to_string(), self.comment2.to_string()]),
								        }
								        untouched = {**self.data2, "entities": [], "cats": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` only the admin's file has a row; the others are empty."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        admin_row = dict(
								            self.data1,
								            entities=[list(self.span.to_tuple())],
								            cats=[self.category1.to_string()],
								            Comments=[self.comment1.to_string()],
								        )
								        expected = {
								            self.project.admin.username: [admin_row],
								            self.project.annotator.username: [],
								            self.project.approver.username: [],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(rows, exported[member])

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        annotated = {
								            **self.data1,
								            "entities": [list(self.span.to_tuple())],
								            "cats": sorted([self.category1.to_string(), self.category2.to_string()]),
								            "Comments": sorted([self.comment1.to_string(), self.comment2.to_string()]),
								        }
								        self.assertEqual(exported, [annotated])


								class TestExportSequenceLabeling(TestExport):
								    """Export checks for a ``SEQUENCE_LABELING`` project."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; ``example1`` gets one span per annotating member, comments and a confirmation."""
								        self.project = prepare_project(ProjectType.SEQUENCE_LABELING, collaborative_annotation=collaborative)
								        item = self.project.item
								        admin, annotator = self.project.admin, self.project.annotator
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.span1 = mommy.make("ExportedSpan", example=self.example1, user=admin, start_offset=0, end_offset=1)
								        self.span2 = mommy.make("ExportedSpan", example=self.example1, user=annotator, start_offset=1, end_offset=2)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        # The second example is created only after the first one is confirmed.
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        self.data1, self.data2 = self.data_to_text(self.example1), self.data_to_text(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"label": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[list(self.span1.to_tuple())], Comments=[self.comment1.to_string()]),
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(self.data1, label=[list(self.span2.to_tuple())], Comments=[self.comment2.to_string()]),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(rows, exported[member])

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        spans = [list(self.span1.to_tuple()), list(self.span2.to_tuple())]
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        annotated = {**self.data1, "label": spans, "Comments": comments}
								        untouched = {**self.data2, "label": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` only the admin's file has a row; the others are empty."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        admin_row = dict(self.data1, label=[list(self.span1.to_tuple())], Comments=[self.comment1.to_string()])
								        expected = {
								            self.project.admin.username: [admin_row],
								            self.project.annotator.username: [],
								            self.project.approver.username: [],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(rows, exported[member])

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        spans = [list(self.span1.to_tuple()), list(self.span2.to_tuple())]
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        self.assertEqual(exported, [{**self.data1, "label": spans, "Comments": comments}])


								class TestExportSpeechToText(TestExport):
								    """Export checks for a ``SPEECH2TEXT`` project (rows are keyed by ``filename``)."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; only ``example1`` gets text labels, comments and a confirmation."""
								        self.project = prepare_project(ProjectType.SPEECH2TEXT, collaborative_annotation=collaborative)
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.text1 = mommy.make("TextLabel", example=self.example1, user=admin)
								        self.text2 = mommy.make("TextLabel", example=self.example1, user=annotator)
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_filename(self.example1), self.data_to_filename(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"label": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[self.text1.text], Comments=[self.comment1.to_string()]),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(self.data1, label=[self.text2.text], Comments=[self.comment2.to_string()]),
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        labels = sorted([self.text1.text, self.text2.text])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        annotated = {**self.data1, "label": labels, "Comments": comments}
								        untouched = {**self.data2, "label": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` every exported file must match its expected rows."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[self.text1.text], Comments=[self.comment1.to_string()]),
								            ],
								            self.project.annotator.username: [],
								            self.project.approver.username: [],
								        }
								        # Driven by the exported files: each one is looked up in ``expected``.
								        for member, rows in exported.items():
								            self.assertEqual(rows, expected[member])

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        labels = sorted([self.text1.text, self.text2.text])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        self.assertEqual(exported, [{**self.data1, "label": labels, "Comments": comments}])


								class TestExportImageClassification(TestExport):
								    """Export checks for an ``IMAGE_CLASSIFICATION`` project (rows are keyed by ``filename``)."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; only ``example1`` gets categories, comments and a confirmation."""
								        self.project = prepare_project(ProjectType.IMAGE_CLASSIFICATION, collaborative_annotation=collaborative)
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.category1 = mommy.make("ExportedCategory", example=self.example1, user=admin)
								        self.category2 = mommy.make("ExportedCategory", example=self.example1, user=annotator)
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_filename(self.example1), self.data_to_filename(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"label": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, label=[self.category1.to_string()], Comments=[self.comment1.to_string()]),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(self.data1, label=[self.category2.to_string()], Comments=[self.comment2.to_string()]),
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        labels = sorted([self.category1.to_string(), self.category2.to_string()])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        annotated = {**self.data1, "label": labels, "Comments": comments}
								        untouched = {**self.data2, "label": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` the admin's file holds just the confirmed example."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        admin_rows = [
								            dict(self.data1, label=[self.category1.to_string()], Comments=[self.comment1.to_string()])
								        ]
								        expected = {self.project.admin.username: admin_rows}
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        labels = sorted([self.category1.to_string(), self.category2.to_string()])
								        comments = sorted([self.comment1.to_string(), self.comment2.to_string()])
								        self.assertEqual(exported, [{**self.data1, "label": labels, "Comments": comments}])


								class TestExportBoundingBox(TestExport):
								    """Export checks for a ``BOUNDING_BOX`` project (rows are keyed by ``filename``)."""

								    def prepare_data(self, collaborative=False):
								        """Create the project and two examples; ``example1`` gets comments, one box per annotating member and a confirmation."""
								        self.project = prepare_project(ProjectType.BOUNDING_BOX, collaborative_annotation=collaborative)
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        admin_box = {"x": 0, "y": 0, "width": 10, "height": 10}
								        annotator_box = {"x": 10, "y": 10, "width": 20, "height": 20}
								        self.bbox1 = mommy.make("ExportedBoundingBox", example=self.example1, user=admin, **admin_box)
								        self.bbox2 = mommy.make("ExportedBoundingBox", example=self.example1, user=annotator, **annotator_box)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_filename(self.example1), self.data_to_filename(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Each member's file lists both examples with only that member's annotations."""
								        self.prepare_data()
								        exported = self.export_dataset()
								        blank = {"bbox": [], "Comments": []}
								        expected = {
								            self.project.admin.username: [
								                dict(self.data1, bbox=[self.bbox1.to_dict()], Comments=[self.comment1.to_dict()]),
								                {**self.data2, **blank},
								            ],
								            self.project.approver.username: [
								                {**self.data1, **blank},
								                {**self.data2, **blank},
								            ],
								            self.project.annotator.username: [
								                dict(self.data1, bbox=[self.bbox2.to_dict()], Comments=[self.comment2.to_dict()]),
								                {**self.data2, **blank},
								            ],
								        }
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_unconfirmed_and_collaborative(self):
								        """The single collaborative file merges every member's annotations."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset()
								        boxes = [self.bbox1.to_dict(), self.bbox2.to_dict()]
								        comments = [self.comment1.to_dict(), self.comment2.to_dict()]
								        annotated = {**self.data1, "bbox": boxes, "Comments": comments}
								        untouched = {**self.data2, "bbox": [], "Comments": []}
								        self.assertEqual(exported, [annotated, untouched])

								    def test_confirmed_and_non_collaborative(self):
								        """With ``confirmed_only`` the admin's file holds just the confirmed example."""
								        self.prepare_data()
								        exported = self.export_dataset(confirmed_only=True)
								        admin_rows = [dict(self.data1, bbox=[self.bbox1.to_dict()], Comments=[self.comment1.to_dict()])]
								        expected = {self.project.admin.username: admin_rows}
								        for member, rows in expected.items():
								            self.assertEqual(exported[member], rows)

								    def test_confirmed_and_collaborative(self):
								        """With ``confirmed_only`` the collaborative file holds just the confirmed example."""
								        self.prepare_data(collaborative=True)
								        exported = self.export_dataset(confirmed_only=True)
								        boxes = [self.bbox1.to_dict(), self.bbox2.to_dict()]
								        comments = [self.comment1.to_dict(), self.comment2.to_dict()]
								        self.assertEqual(exported, [{**self.data1, "bbox": boxes, "Comments": comments}])


								class TestExportSegmentation(TestExport):

								    def prepare_data(self, collaborative=False):
								        """Create a ``SEGMENTATION`` project and two examples; ``example1`` gets comments, one segmentation per annotating member and a confirmation."""
								        self.project = prepare_project(ProjectType.SEGMENTATION, collaborative_annotation=collaborative)
								        item = self.project.item
								        self.example1 = mommy.make("ExportedExample", project=item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=item, text="unconfirmed")
								        admin, annotator = self.project.admin, self.project.annotator
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=annotator)
								        self.seg1 = mommy.make("ExportedSegmentation", example=self.example1, user=admin, points=[0, 1])
								        self.seg2 = mommy.make("ExportedSegmentation", example=self.example1, user=annotator, points=[1, 2])
								        mommy.make("ExampleState", example=self.example1, confirmed_by=admin)
								        self.data1, self.data2 = self.data_to_filename(self.example1), self.data_to_filename(self.example2)
								        # Name of the exported column that the tests expect segmentations under.
								        self.column = "segmentation"


								    def test_unconfirmed_and_non_collaborative(self):

								        self.prepare_data()

								        datasets = self.export_dataset()

								        expected_datasets = {

								            self.project.admin.username: [

								                {**self.data1, self.column: [self.seg1.to_dict()], "Comments": [self.comment1.to_dict()]},

								                {**self.data2, self.column: [], "Comments": []},

								            ],

								            self.project.approver.username: [

								                {**self.data1, self.column: [], "Comments": []},

								                {**self.data2, self.column: [], "Comments": []},

								            ],

								            self.project.annotator.username: [

								                {**self.data1, self.column: [self.seg2.to_dict()], "Comments": [self.comment2.to_dict()]},

								                {**self.data2, self.column: [], "Comments": []},

								            ],

								        }

								        for username, dataset in expected_datasets.items():

								            self.assertEqual(datasets[username], dataset)


								    def test_unconfirmed_and_collaborative(self):

								        self.prepare_data(collaborative=True)

								        dataset = self.export_dataset()

								        expected_dataset = [

								            {

								                **self.data1,

								                self.column: [self.seg1.to_dict(), self.seg2.to_dict()],

								                "Comments": [self.comment1.to_dict(), self.comment2.to_dict()],

								            },

								            {**self.data2, self.column: [], "Comments": []},

								        ]

								        self.assertEqual(dataset, expected_dataset)


								    def test_confirmed_and_non_collaborative(self):

								        self.prepare_data()

								        datasets = self.export_dataset(confirmed_only=True)

								        expected_datasets = {

								            self.project.admin.username: [

								                {**self.data1, self.column: [self.seg1.to_dict()], "Comments": [self.comment1.to_dict()]}

								            ]

								        }

								        for username, dataset in expected_datasets.items():

								            self.assertEqual(datasets[username], dataset)


								    def test_confirmed_and_collaborative(self):

								        self.prepare_data(collaborative=True)

								        dataset = self.export_dataset(confirmed_only=True)

								        expected_dataset = [

								            {

								                **self.data1,

								                self.column: [self.seg1.to_dict(), self.seg2.to_dict()],

								                "Comments": [self.comment1.to_dict(), self.comment2.to_dict()],

								            }

								        ]

								        self.assertEqual(dataset, expected_dataset)


								class TestExportImageCaptioning(TestExport):
								    """Export tests for projects of type ``ProjectType.IMAGE_CAPTIONING``."""

								    def prepare_data(self, collaborative=False):
								        """Create the fixture shared by every test in this class.

								        Builds one project with two examples. ``example1`` receives a comment
								        and a ``TextLabel`` from both the admin and the annotator and is marked
								        as confirmed by the admin; ``example2`` has no annotations.

								        Args:
								            collaborative: forwarded to ``prepare_project`` as
								                ``collaborative_annotation``.
								        """
								        self.project = prepare_project(ProjectType.IMAGE_CAPTIONING, collaborative_annotation=collaborative)
								        self.example1 = mommy.make("ExportedExample", project=self.project.item, text="confirmed")
								        self.example2 = mommy.make("ExportedExample", project=self.project.item, text="unconfirmed")
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=self.project.admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=self.project.annotator)
								        self.text1 = mommy.make("TextLabel", example=self.example1, user=self.project.admin)
								        self.text2 = mommy.make("TextLabel", example=self.example1, user=self.project.annotator)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=self.project.admin)
								        self.data1 = self.data_to_filename(self.example1)
								        self.data2 = self.data_to_filename(self.example2)
								        # Key under which the caption texts are expected in each exported record.
								        self.column = "label"

								    def test_unconfirmed_and_non_collaborative(self):
								        """Per-user export without the confirmed filter: each user sees only their own labels."""
								        self.prepare_data()
								        datasets = self.export_dataset()
								        expected_datasets = {
								            self.project.admin.username: [
								                {**self.data1, self.column: [self.text1.text], "Comments": [self.comment1.to_string()]},
								                {**self.data2, self.column: [], "Comments": []},
								            ],
								            self.project.approver.username: [
								                {**self.data1, self.column: [], "Comments": []},
								                {**self.data2, self.column: [], "Comments": []},
								            ],
								            self.project.annotator.username: [
								                {**self.data1, self.column: [self.text2.text], "Comments": [self.comment2.to_string()]},
								                {**self.data2, self.column: [], "Comments": []},
								            ],
								        }
								        for username, dataset in expected_datasets.items():
								            self.assertEqual(datasets[username], dataset)

								    def test_unconfirmed_and_collaborative(self):
								        """Collaborative export without the confirmed filter: labels of all users are merged."""
								        self.prepare_data(collaborative=True)
								        dataset = self.export_dataset()
								        expected_dataset = [
								            {
								                **self.data1,
								                # The expectation is built from sorted label texts and comment strings.
								                self.column: sorted([self.text1.text, self.text2.text]),
								                "Comments": sorted([self.comment1.to_string(), self.comment2.to_string()]),
								            },
								            {**self.data2, self.column: [], "Comments": []},
								        ]
								        self.assertEqual(dataset, expected_dataset)

								    def test_confirmed_and_non_collaborative(self):
								        """Per-user export with ``confirmed_only=True``.

								        The admin must have exactly the confirmed ``data1`` record; any other
								        user present in the export must have no records.
								        """
								        self.prepare_data()
								        datasets = self.export_dataset(confirmed_only=True)
								        expected_datasets = {
								            self.project.admin.username: [
								                {**self.data1, self.column: [self.text1.text], "Comments": [self.comment1.to_string()]},
								            ],
								            self.project.approver.username: [],
								            self.project.annotator.username: [],
								        }
								        # The loop below iterates over the *actual* export, so on its own it
								        # would pass vacuously if the admin's data were missing entirely.
								        self.assertIn(self.project.admin.username, datasets)
								        for username, dataset in datasets.items():
								            self.assertEqual(dataset, expected_datasets[username])

								    def test_confirmed_and_collaborative(self):
								        """Collaborative export with ``confirmed_only=True``: a single merged ``data1`` record."""
								        self.prepare_data(collaborative=True)
								        dataset = self.export_dataset(confirmed_only=True)
								        expected_dataset = [
								            {
								                **self.data1,
								                self.column: sorted([self.text1.text, self.text2.text]),
								                "Comments": sorted([self.comment1.to_string(), self.comment2.to_string()]),
								            }
								        ]
								        self.assertEqual(dataset, expected_dataset)


								class TestExportRelation(TestExport):
								    """Export tests for sequence-labeling projects created with ``use_relation=True``."""

								    def prepare_data(self, collaborative=False):
								        """Create the fixture shared by every test in this class.

								        Builds one project with two examples. On ``example1`` the admin owns
								        ``span1``, ``span2`` and the relation from ``span1`` to ``span2``; the
								        annotator owns ``span3``. Both users leave one comment on ``example1``,
								        which is marked as confirmed by the admin. ``example2`` has no
								        annotations.

								        Args:
								            collaborative: forwarded to ``prepare_project`` as
								                ``collaborative_annotation``.
								        """
								        self.project = prepare_project(
								            ProjectType.SEQUENCE_LABELING, use_relation=True, collaborative_annotation=collaborative
								        )
								        self.example1 = mommy.make("ExportedExample", project=self.project.item, text="example")
								        self.example2 = mommy.make("ExportedExample", project=self.project.item, text="unconfirmed")
								        self.span1 = mommy.make(
								            "ExportedSpan", example=self.example1, user=self.project.admin, start_offset=0, end_offset=1
								        )
								        self.span2 = mommy.make(
								            "ExportedSpan", example=self.example1, user=self.project.admin, start_offset=1, end_offset=2
								        )
								        self.span3 = mommy.make(
								            "ExportedSpan", example=self.example1, user=self.project.annotator, start_offset=2, end_offset=3
								        )
								        self.relation = mommy.make(
								            "ExportedRelation", from_id=self.span1, to_id=self.span2, example=self.example1, user=self.project.admin
								        )
								        self.comment1 = mommy.make("ExportedComment", example=self.example1, user=self.project.admin)
								        self.comment2 = mommy.make("ExportedComment", example=self.example1, user=self.project.annotator)
								        mommy.make("ExampleState", example=self.example1, confirmed_by=self.project.admin)
								        self.data1 = self.data_to_text(self.example1)
								        self.data2 = self.data_to_text(self.example2)

								    def test_unconfirmed_and_non_collaborative(self):
								        """Per-user export without the confirmed filter: each user sees only their own labels."""
								        self.prepare_data()
								        datasets = self.export_dataset()
								        expected_datasets = {
								            self.project.admin.username: [
								                {
								                    **self.data1,
								                    "entities": [self.span1.to_dict(), self.span2.to_dict()],
								                    "relations": [self.relation.to_dict()],
								                    "Comments": [self.comment1.to_dict()],
								                },
								                {**self.data2, "entities": [], "relations": [], "Comments": []},
								            ],
								            self.project.annotator.username: [
								                {
								                    **self.data1,
								                    "entities": [self.span3.to_dict()],
								                    "relations": [],
								                    "Comments": [self.comment2.to_dict()],
								                },
								                {**self.data2, "entities": [], "relations": [], "Comments": []},
								            ],
								            self.project.approver.username: [
								                {**self.data1, "entities": [], "relations": [], "Comments": []},
								                {**self.data2, "entities": [], "relations": [], "Comments": []},
								            ],
								        }
								        for username, dataset in expected_datasets.items():
								            self.assertEqual(datasets[username], dataset)

								    def test_unconfirmed_and_collaborative(self):
								        """Collaborative export without the confirmed filter: labels of all users are merged."""
								        self.prepare_data(collaborative=True)
								        dataset = self.export_dataset()
								        expected_dataset = [
								            {
								                **self.data1,
								                "entities": [self.span1.to_dict(), self.span2.to_dict(), self.span3.to_dict()],
								                "relations": [self.relation.to_dict()],
								                "Comments": [self.comment1.to_dict(), self.comment2.to_dict()],
								            },
								            {**self.data2, "entities": [], "relations": [], "Comments": []},
								        ]
								        self.assertEqual(dataset, expected_dataset)

								    def test_confirmed_and_non_collaborative(self):
								        """Per-user export with ``confirmed_only=True``.

								        The admin must have exactly the confirmed ``data1`` record; any other
								        user present in the export must have no records.
								        """
								        self.prepare_data()
								        datasets = self.export_dataset(confirmed_only=True)
								        expected_datasets = {
								            self.project.admin.username: [
								                {
								                    **self.data1,
								                    "entities": [self.span1.to_dict(), self.span2.to_dict()],
								                    "relations": [self.relation.to_dict()],
								                    "Comments": [self.comment1.to_dict()],
								                },
								            ],
								            self.project.annotator.username: [],
								            self.project.approver.username: [],
								        }
								        # The loop below iterates over the *actual* export, so on its own it
								        # would pass vacuously if the admin's data were missing entirely.
								        self.assertIn(self.project.admin.username, datasets)
								        for username, dataset in datasets.items():
								            self.assertEqual(dataset, expected_datasets[username])

								    def test_confirmed_and_collaborative(self):
								        """Collaborative export with ``confirmed_only=True``: a single merged ``data1`` record."""
								        self.prepare_data(collaborative=True)
								        dataset = self.export_dataset(confirmed_only=True)
								        expected_dataset = [
								            {
								                **self.data1,
								                "entities": [self.span1.to_dict(), self.span2.to_dict(), self.span3.to_dict()],
								                "relations": [self.relation.to_dict()],
								                "Comments": [self.comment1.to_dict(), self.comment2.to_dict()],
								            }
								        ]
								        self.assertEqual(dataset, expected_dataset)