Reimplement logic of getting labels in coco converter (#319)

* Reimplement logic of getting labels in coco converter * Fixes in converter
cvat-ai · Apr 1, 2019 · 21de4cf · 21de4cf
1 parent e96d4fd
commit 21de4cf
Show file tree

Hide file tree

Showing 2 changed files with 92 additions and 48 deletions.
diff --git a/utils/coco/converter.md b/utils/coco/converter.md
@@ -24,13 +24,13 @@ $ cat ../requirements.txt requirements.txt | xargs -n 1 -L 1 pip install
 Run the script inside the virtual environment.
 
 ```bash
-python converter.py --cvat-xml </path/to/cvat/annotation.xml> --output </path/to/output/coco/annotation.json> --image-dir </path/to/directory/with/images> --draw </path/to/save/directory> --draw_labels --use_background_label
+python converter.py --cvat-xml </path/to/cvat/annotation.xml> --output </path/to/output/coco/annotation.json> --image-dir </path/to/directory/with/images> --labels </path/to/file/with/labels.txt> --draw </path/to/save/directory> --draw_labels --use_background_label
 ```
 
 Please run `python converter.py --help` for more details.
 
 #### Labels
-The script parses input annotation and find field `labels` to find which labels are presented. If were not found any labels in annotation, script try to parse text file `labels.txt` in the same directory as annotation. This file should include labels in one string separated by spaces or one label per string and also their combinations. For example:
+If '--labels' argument is used, the script gets names of labels from a file. If file with labels is not defined, the script parses input annotation and find field `labels` to find which labels are presented. File with labels should include labels in one string separated by spaces or one label per string and also their combinations. For example:
 ```
 label1 label2
 label3

diff --git a/utils/coco/converter.py b/utils/coco/converter.py
@@ -30,13 +30,17 @@ def parse_args():
         help='input file with CVAT annotation in *.xml format'
     )
     parser.add_argument(
-        '--output', required=True,
-        help='output annotation file'
+        '--output', default=None,
+        help='output annotation file. If not defined, the output file name will be created from input file name'
     )
     parser.add_argument(
         '--image-dir', required=True,
         help='directory with images from annotation'
     )
+    parser.add_argument(
+        '--labels', default=None,
+        help='path to file with labels'
+    )
     parser.add_argument(
         '--draw', default=None,
         help='directory to save images with its segments. By default is disabled'
@@ -89,6 +93,7 @@ def mask_to_polygon(mask, tolerance=1.0, area_threshold=1):
                 polygons.append(reshaped_contour)
     return polygons
 
+
 def draw_polygons(polygons, img_name, input_dir, output_dir, draw_labels):
     """Draw on image contours of its objects and save
     Args:
@@ -123,6 +128,7 @@ def draw_polygons(polygons, img_name, input_dir, output_dir, draw_labels):
                 cv2.putText(img, label, (x, y), cv2.FONT_HERSHEY_COMPLEX_SMALL, 1, red, 1)
     cv2.imwrite(output_file, img)
 
+
 def fix_segments_intersections(polygons, height, width, img_name, use_background_label,
                                threshold=0.0, ratio_tolerance=0.001, area_threshold=1):
     """Find all intersected regions and crop contour for back object by objects which
@@ -206,6 +212,7 @@ def fix_segments_intersections(polygons, height, width, img_name, use_background
 
     return output_polygons
 
+
 def polygon_area_and_bbox(polygon, height, width):
     """Calculate area of object's polygon and bounding box around it
     Args:
@@ -222,6 +229,7 @@ def polygon_area_and_bbox(polygon, height, width):
             max(bbox[:, 1] + bbox[:, 3]) - min(bbox[:, 1])]
     return area, bbox
 
+
 def insert_license_data(result_annotation):
     """Fill license fields in annotation by blank data
     Args:
@@ -233,6 +241,7 @@ def insert_license_data(result_annotation):
         'url': ''
     })
 
+
 def insert_info_data(xml_root, result_annotation):
     """Fill available information of annotation
     Args:
@@ -266,56 +275,84 @@ def insert_info_data(xml_root, result_annotation):
     }
     log.info('Found the next information data: {}'.format(result_annotation['info']))
 
-def insert_categories_data(xml_root, use_background_label, result_annotation, xml_dir):
+
+def insert_categories_data(xml_root, use_background_label, result_annotation, labels_file=None):
     """Get labels from input annotation and fill categories field in output annotation
     Args:
         xml_root: root for xml parser
         use_background_label: key to enable using label background
         result_annotation: output annotation in COCO representation
-        xml_dir: directory with input annotation
+        labels_file: path to file with labels names.
+                     If not defined, parse annotation to get labels names
     """
-    log.info('Reading labels...')
+    def get_categories(names, bg_found, use_background_label, sort=False):
+        bg_used = False
+        category_map = {}
+        categories = []
+        # Sort labels by its names to make the same order of ids for different annotations
+        if sort:
+            names.sort()
+        # Always use id = 0 for background
+        if bg_found and use_background_label:
+            category_map['background'] = 0
+            bg_used = True
+        cat_id = 1
+        # Define id for all labels beginning from 1
+        for name in names:
+            if name == 'background':
+                continue
+            category_map[name] = cat_id
+            categories.append({'id': cat_id, 'name': name, 'supercategory': ''})
+            cat_id += 1
+        return category_map, categories, bg_used
+
     categories = []
     category_map = {}
+    label_names = []
     bg_found = False
-    id = 0
-    for label in xml_root.iter('label'):
-        for name in label.findall("./name"):
-            if not use_background_label and name.text == 'background':
-                bg_found = True
-                continue
-            category_map[name.text] = id
-            categories.append({'id': id, 'name': name.text, 'supercategory': ''})
-            id += 1
+    bg_used = False
+
+    if labels_file is None:
+        log.info('Reading labels from annotation...')
+        for label in xml_root.iter('label'):
+            for name in label.findall("./name"):
+                if name.text == 'background':
+                    bg_found = True
+                    continue
+                label_names.append(name.text)
+        if len(label_names) == 0:
+            log.info('Labels in annotation were not found. Please use \'--labels\' argument to define file with labels.')
+        else:
+            category_map, categories, bg_used = get_categories(label_names, bg_found, use_background_label, sort=True)
+    else:
+        log.info('Parsing labels from file <{}>...'.format(labels_file))
+        with open(labels_file, 'r') as file:
+            string = '  '
+            while string != '' and string != '\n':
+                string = file.readline()
+                labels = string.split(' ')
+                for label in labels:
+                    if label == '\n' or label == '':
+                        continue
+                    label = label.replace('\n', '')
+                    if label == 'background':
+                        bg_found = True
+                        continue
+                    label_names.append(label)
+            category_map, categories, bg_used = get_categories(label_names, bg_found, use_background_label)
+
     if len(categories) == 0:
-        log.info('Labels in annotation were not found. Trying to find file <labels.txt> in <{}>'.format(xml_dir))
-        if osp.isfile(osp.join(xml_dir, 'labels.txt')):
-            labels_file = osp.join(xml_dir, 'labels.txt')
-            log.info('File <labels.txt> was found in <{}>. Reading...'.format(xml_dir))
-            with open(labels_file, 'r') as file:
-                string = '  '
-                id = 0
-                while string != '' and string != '\n':
-                    string = file.readline()
-                    labels = string.split(' ')
-                    for l in labels:
-                        if l == '\n':
-                            continue
-                        if not use_background_label and l == 'background':
-                            bg_found = True
-                            continue
-                        category_map[l] = id
-                        categories.append({'id': id, 'name': l, 'supercategory': ''})
-                        id += 1
+        raise ValueError('Categories list is empty. Something wrong.')
 
     result_annotation['categories'] = categories
     log.info('Found the next labels: {}'.format(category_map))
-    if bg_found:
+    if bg_found and not bg_used:
         log.warning('Label <background> was found but not used. '
                     'To enable it should use command line argument [--use_background_label]')
     return category_map
 
-def insert_image_data(image, path_to_images, result_annotation):
+
+def insert_image_data(image, result_annotation):
     """Get data from input annotation for image and fill fields for this image in output annotation
     Args:
         image: dictionary with data for image from original annotation
@@ -329,11 +366,11 @@ def insert_image_data(image, path_to_images, result_annotation):
     new_img['license'] = 0
     new_img['id'] = image['id']
     new_img['file_name'] = osp.basename(image['name'])
-    pic = cv2.imread(osp.join(path_to_images, new_img['file_name']))
-    new_img['height'] = pic.shape[0]
-    new_img['width'] = pic.shape[1]
+    new_img['height'] = int(image['height'])
+    new_img['width'] = int(image['width'])
     result_annotation['images'].append(new_img)
 
+
 def insert_annotation_data(image, category_map, segm_id, object, img_dims, result_annotation):
     """Get data from input annotation for object and fill fields for this object in output annotation
     Args:
@@ -359,10 +396,14 @@ def insert_annotation_data(image, category_map, segm_id, object, img_dims, resul
 def main():
     args = parse_args()
     xml_file_name = args.cvat_xml
-    output_file_name = args.output
+    if args.output is not None:
+        output_file_name = args.output
+    else:
+        output_file_name = args.cvat_xml.split('.xml')[0] + '.json'
+        log.info('Output file name set to: {}'.format(output_file_name))
     root = etree.parse(xml_file_name).getroot()
 
-    if args.draw != None:
+    if args.draw is not None:
         log.info('Draw key was enabled. Images will be saved in directory <{}>'.format(args.draw))
 
     result_annotation = {
@@ -375,7 +416,7 @@ def main():
 
     insert_license_data(result_annotation)
     insert_info_data(root, result_annotation)
-    category_map = insert_categories_data(root, args.use_background_label, result_annotation, osp.dirname(xml_file_name))
+    category_map = insert_categories_data(root, args.use_background_label, result_annotation, labels_file=args.labels)
 
     if len(category_map) == 0:
         sys.exit('Labels were not found. Be sure that annotation <{}> includes field <labels> or '
@@ -388,6 +429,9 @@ def main():
         image = {}
         for key, value in img.items():
             image[key] = value
+        img_name = osp.join(args.image_dir, osp.basename(image['name']))
+        if not osp.isfile(img_name):
+            log.warning('Image <{}> is not available'.format(img_name))
         image['polygon'] = []
         z_order_on_counter = 0
         polygon_counter = 0
@@ -407,7 +451,7 @@ def main():
 
         # Create new image
         image['id'] = int(image['id'])
-        insert_image_data(image, args.image_dir, result_annotation)
+        insert_image_data(image, result_annotation)
         height = result_annotation['images'][-1]['height']
         width = result_annotation['images'][-1]['width']
         image['polygon'] = fix_segments_intersections(image['polygon'], height, width,
@@ -420,7 +464,7 @@ def main():
             segm_id += 1
 
         # Draw contours of objects on image
-        if args.draw != None:
+        if args.draw is not None:
             draw_polygons(image['polygon'], image['name'], args.image_dir, args.draw, args.draw_labels)
 
     log.info('Processed images: {}'.format(len(result_annotation['images'])))
@@ -438,12 +482,12 @@ def main():
     # Try to load created annotation via cocoapi
     try:
         log.info('Trying to load annotation <{}> via cocoapi...'.format(output_file_name))
-        anno = coco_loader.COCO(output_file_name)
+        coco_loader.COCO(output_file_name)
     except:
         raise
     else:
-        log.info('Annotation in COCO representation <{}> created from <{}> successfully!'
-                 .format(output_file_name, xml_file_name))
+        log.info('Conversion <{}> --> <{}> has finished successfully!'.format(xml_file_name, output_file_name))
+
 
 if __name__ == "__main__":
     main()