MS COCO數據標注詳解

本文轉載自查看原文 2019-03-27 15:36 2604 Object Detection

轉發：https://blog.csdn.net/wc781708249/article/details/79603522

參考：

cocodataset/cocoapi
philferriere/cocoapi- support Windows build and python3
COCO 標注詳解
COCO數據集annotation內容
Dataset - COCO Dataset 數據特點

JSON文件
打開JSON文件查看數據特點
Object Instance 類型的標注格式
Object Keypoint 類型的標注格式
Image Caption的標注格式

JSON文件

json文件主要包含以下幾個字段：
詳細描述參考 COCO 標注詳解

{
    "info": info, # dict
    "licenses": [license], # list ，內部是dict
    "images": [image], # list ，內部是dict
    "annotations": [annotation], # list ，內部是dict
    "categories": [category] # list ，內部是dict
}

打開JSON文件查看數據特點

由於JSON文件太大，很多都是重復定義的，所以只提取一張圖片，存儲成新的JSON文件，便於觀察。

# -*- coding:utf-8 -*-

from __future__ import print_function
from pycocotools.coco import COCO
import os, sys, zipfile
import urllib.request
import shutil
import numpy as np
import skimage.io as io
import matplotlib.pyplot as plt
import pylab
import json

# Extract the first image of a COCO annotation file, together with all of its
# annotations, into a small stand-alone JSON file that is easy to inspect.
json_file='./annotations/instances_val2017.json' # Object Instance annotations
# person_keypoints_val2017.json # Object Keypoint annotations
# captions_val2017.json # Image Caption annotations

# Use a context manager so the (large) input file is closed as soon as it is parsed.
with open(json_file,'r') as f:
    data=json.load(f)

data_2={}
data_2['info']=data['info']
data_2['licenses']=data['licenses']
data_2['images']=[data['images'][0]] # keep only the first image
# Caption annotation files have no "categories" section, so copy it only when present.
if 'categories' in data:
    data_2['categories']=data['categories']

# Collect every annotation that belongs to the selected image.
imgID=data_2['images'][0]['id']
annotation=[ann for ann in data['annotations'] if ann['image_id']==imgID]

data_2['annotations']=annotation

# Save to a new JSON file; indent=4 makes the output readable.
# The context manager guarantees the output is flushed and closed.
with open('./new_instances_val2017.json','w') as f:
    json.dump(data_2,f,indent=4)

Object Instance 類型的標注格式

主要有以下幾個字段：

這里寫圖片描述

info

"info": { # 數據集信息描述
        "description": "COCO 2017 Dataset", # 數據集描述
        "url": "http://cocodataset.org", # 下載地址
        "version": "1.0", # 版本
        "year": 2017, # 年份
        "contributor": "COCO Consortium", # 提供者
        "date_created": "2017/09/01" # 數據創建日期
    },

licenses

"licenses": [
        {
            "url": "http://creativecommons.org/licenses/by-nc-sa/2.0/",
            "id": 1,
            "name": "Attribution-NonCommercial-ShareAlike License"
        },
        ……
        ……
    ],

images

"images": [
        {
            "license": 4,
            "file_name": "000000397133.jpg", # 圖片名
            "coco_url":  "http://images.cocodataset.org/val2017/000000397133.jpg",# 網路地址路徑
            "height": 427, # 高
            "width": 640, # 寬
            "date_captured": "2013-11-14 17:02:52", # 數據獲取日期
            "flickr_url": "http://farm7.staticflickr.com/6116/6255196340_da26cf2c9e_z.jpg",# flickr網路地址
            "id": 397133 # 圖片的ID編號（每張圖片ID是唯一的）
        },
        ……
        ……
    ],

annotations

"annotations": [
        {
            "segmentation": [ # 對象的邊界點（邊界多邊形）
                [
                    224.24,297.18,# 第一個點 x,y坐標
                    228.29,297.18, # 第二個點 x,y坐標
                    234.91,298.29,
                    ……
                    ……
                    225.34,297.55
                ]
            ],
            "area": 1481.3806499999994, # 區域面積
            "iscrowd": 0, # 0 表示單個對象（segmentation 為 polygon 格式）；1 表示一組對象（segmentation 為 RLE 格式）
            "image_id": 397133, # 對應的圖片ID（與images中的ID對應）
            "bbox": [217.62,240.54,38.99,57.75], # 定位邊框 [x,y,w,h]
            "category_id": 44, # 類別ID（與categories中的ID對應）
            "id": 82445 # 對象ID，因為每一個圖像有不止一個對象，所以要對每一個對象編號（每個對象的ID是唯一的）
        },
        ……
        ……
        ]

注意，單個的對象（iscrowd=0）可能需要多個polygon來表示，比如這個對象在圖像中被擋住了。而iscrowd=1時（將標注一組對象，比如一群人）的segmentation使用的就是RLE格式。

可視化

現在調用cocoapi顯示剛生成的JSON文件，並檢查是否有問題。

# -*- coding:utf-8 -*-

from __future__ import print_function
from pycocotools.coco import COCO
import os, sys, zipfile
import urllib.request
import shutil
import numpy as np
import skimage.io as io
import matplotlib.pyplot as plt
import pylab
# Visual sanity check of the single-image JSON file: print the category names,
# show the image, then overlay instance, keypoint and caption annotations.
pylab.rcParams['figure.figsize'] = (8.0, 10.0)

annFile='./new_instances_val2017.json'
coco=COCO(annFile)

# display COCO categories and supercategories
cats = coco.loadCats(coco.getCatIds())
nms=[cat['name'] for cat in cats]
print('COCO categories: \n{}\n'.format(' '.join(nms)))

# nms is reused here: it now holds the de-duplicated supercategory names
nms = set([cat['supercategory'] for cat in cats])
print('COCO supercategories: \n{}'.format(' '.join(nms)))

# imgIds = coco.getImgIds(imgIds = [324158])
# Take the first image id found in the annotation file.
imgIds = coco.getImgIds()
img = coco.loadImgs(imgIds[0])[0]
dataDir = '.'
dataType = 'val2017'
# The image is read from <dataDir>/<dataType>/<file_name>
I = io.imread('%s/%s/%s'%(dataDir,dataType,img['file_name']))

# First figure: the raw image without any overlay
plt.axis('off')
plt.imshow(I)
plt.show()


# load and display instance annotations
# Load the instance masks
# catIds = coco.getCatIds(catNms=['person','dog','skateboard']);
# catIds=coco.getCatIds()
# Collect the category id of every annotation attached to the selected image
# (duplicates are kept; one entry per annotation).
catIds=[]
for ann in coco.dataset['annotations']:
    if ann['image_id']==imgIds[0]:
        catIds.append(ann['category_id'])

plt.imshow(I); plt.axis('off')
annIds = coco.getAnnIds(imgIds=img['id'], catIds=catIds, iscrowd=None)
anns = coco.loadAnns(annIds)
coco.showAnns(anns)
# NOTE(review): there is no plt.show() here, so the following drawing calls are
# issued before this overlay is displayed - confirm whether a separate figure
# per annotation type was intended.

# initialize COCO api for person keypoints annotations
annFile = '{}/annotations/person_keypoints_{}.json'.format(dataDir,dataType)
coco_kps=COCO(annFile)

# load and display keypoints annotations
# Load the body keypoints
plt.imshow(I); plt.axis('off')
ax = plt.gca()  # NOTE(review): ax is not used anywhere below in this script
# The category ids gathered from the instance file are reused as the filter here.
annIds = coco_kps.getAnnIds(imgIds=img['id'], catIds=catIds, iscrowd=None)
anns = coco_kps.loadAnns(annIds)
coco_kps.showAnns(anns)

# initialize COCO api for caption annotations
annFile = '{}/annotations/captions_{}.json'.format(dataDir,dataType)
coco_caps=COCO(annFile)

# load and display caption annotations
# Load the text captions
annIds = coco_caps.getAnnIds(imgIds=img['id']);
anns = coco_caps.loadAnns(annIds)
coco_caps.showAnns(anns)
# Draw the image once more and display the pending figure
plt.imshow(I); plt.axis('off'); plt.show()

這里寫圖片描述

A man is in a kitchen making pizzas.
Man in apron standing on front of oven with pans and bakeware
A baker is working in the kitchen rolling dough.
A person standing by a stove in a kitchen.
A table with pies being made and a person standing near a wall with pots and pans hanging on the wall.
   
   
   
           
  
  
  
          
   
   
   
           1
   
   
   
           2
   
   
   
           3
   
   
   
           4
   
   
   
           5

仿照COCO JSON文件

仿照COCO的數據格式，將labelme的JSON改造成COCO的JSON

首先是要`labelme`做好圖片標注

這里寫圖片描述

說明：（類別不一定對，只是為了說明問題）
bobcat-美國短耳貓
plushcat-布偶貓
deerhound-小鹿犬
mainecat-緬因貓
golden-金毛

將labelme的JSON轉成COCO格式JSON

這里寫一個class實現以下功能，labelme2COCO.py中的部分代碼如下：

def image(self,data,num):
        """Build one COCO ``images`` entry from a parsed labelme JSON dict.

        Args:
            data: labelme JSON content; ``data['imageData']`` (base64 image
                data) and ``data['imagePath']`` are read.
            num: zero-based index of the file; the image id is ``num + 1``.

        Returns:
            dict with the keys ``height``, ``width``, ``id`` and ``file_name``.

        Side effects:
            Stores the image size on ``self.height`` / ``self.width``.
        """
        image={}
        img = utils.img_b64_to_array(data['imageData'])  # decode the embedded image data
        # Alternative ways to obtain the image, by path instead of embedded data:
        # img=io.imread(data['imagePath'])
        # img = cv2.imread(data['imagePath'], 0)
        height, width = img.shape[:2]
        image['height']=height
        image['width'] = width
        image['id']=num+1
        # labelme files written on Windows store imagePath with backslashes;
        # normalise the separators so only the bare file name is kept.
        image['file_name'] = data['imagePath'].replace('\\','/').split('/')[-1]

        self.height=height
        self.width=width

        return image

   def categorie(self,label):
       """Build one COCO ``categories`` entry.

       Args:
           label: indexable pair; ``label[0]`` becomes the supercategory and
               ``label[1]`` the category name.

       Returns:
           dict with the keys ``supercategory``, ``id`` and ``name``.
       """
       return {
           'supercategory': label[0],
           # ids start at 1 because 0 is treated as background by default;
           # presumably self.label holds the labels registered so far - verify against caller
           'id': len(self.label)+1,
           'name': label[1],
       }

   def annotation(self,points,label,num):
       """Build one COCO ``annotations`` entry for a labelled polygon.

       Args:
           points: polygon vertices as a sequence of ``[x, y]`` pairs.
           label: label passed to ``self.getcatid`` to obtain the category id.
           num: zero-based index of the image; ``image_id`` is ``num + 1``.

       Returns:
           dict with the keys ``segmentation``, ``iscrowd``, ``image_id``,
           ``bbox``, ``category_id`` and ``id``, holding only native Python
           numbers so that it can be written with ``json.dump``.
       """
       annotation={}
       # .tolist() converts to native Python numbers. list(ndarray) would keep
       # NumPy scalars, and json cannot serialise NumPy integers.
       annotation['segmentation']=[np.asarray(points).flatten().tolist()]
       annotation['iscrowd'] = 0
       annotation['image_id'] = num+1
       # Cast every bbox value to float so the list is JSON-serialisable
       # (an earlier version stored str(bbox) to work around a dump error).
       annotation['bbox'] = list(map(float,self.getbbox(points)))

       annotation['category_id'] = self.getcatid(label)
       annotation['id'] = self.annID
       return annotation

注：這里只實現images、categories、annotations三個字段內容，因為只用到這幾個字段

可視化數據

這部分是使用COCO的API接口打開剛才自己生成的JSON文件，以驗證是否存在問題。

visualization.py

# -*- coding:utf-8 -*-

from __future__ import print_function
from pycocotools.coco import COCO
import os, sys, zipfile
import urllib.request
import shutil
import numpy as np
import skimage.io as io
import matplotlib.pyplot as plt
import pylab
# Visual sanity check of the self-made COCO-style JSON file: print the category
# names, pick one image at random, show it, then overlay its instance masks.
pylab.rcParams['figure.figsize'] = (8.0, 10.0)

annFile='./new.json'
coco=COCO(annFile)

# display COCO categories and supercategories
cats = coco.loadCats(coco.getCatIds())
nms=[cat['name'] for cat in cats]
print('COCO categories: \n{}\n'.format(' '.join(nms)))

# nms is reused here: it now holds the de-duplicated supercategory names
nms = set([cat['supercategory'] for cat in cats])
print('COCO supercategories: \n{}'.format(' '.join(nms)))

# imgIds = coco.getImgIds(imgIds = [324158])
imgIds = coco.getImgIds()
# Despite its name, imgId is a random *index* into imgIds, not an image id.
imgId=np.random.randint(0,len(imgIds))
img = coco.loadImgs(imgIds[imgId])[0]
dataDir = '.'
# dataType = 'val2017'
# I = io.imread('%s/%s/%s'%(dataDir,dataType,img['file_name']))
# The image is read from <dataDir>/<file_name> (no dataset sub-directory here)
I = io.imread('%s/%s'%(dataDir,img['file_name']))

# First figure: the raw image without any overlay
plt.axis('off')
plt.imshow(I)
plt.show()


# load and display instance annotations
# Load the instance masks
# catIds = coco.getCatIds(catNms=['person','dog','skateboard']);
# catIds=coco.getCatIds()
# Collect the category id of every annotation attached to the selected image
# (duplicates are kept; one entry per annotation).
catIds=[]
for ann in coco.dataset['annotations']:
    if ann['image_id']==imgIds[imgId]:
        catIds.append(ann['category_id'])

# Second figure: the image with its annotations drawn on top
plt.imshow(I); plt.axis('off')
annIds = coco.getAnnIds(imgIds=img['id'], catIds=catIds, iscrowd=None)
anns = coco.loadAnns(annIds)
coco.showAnns(anns)
plt.show()

顯示結果：

這里寫圖片描述

Object Keypoint 類型的標注格式

運行腳本one_image_json.py 得到單張圖片的JSON信息。

基本上內容與Object Instance的標注格式一樣，不同的地方在於categories、annotations字段內容不一樣。

主要內容有：

{
    "info": { 
        "description": "COCO 2017 Dataset",
        "url": "http://cocodataset.org",
        "version": "1.0",
        "year": 2017,
        "contributor": "COCO Consortium",
        "date_created": "2017/09/01"
    },
    "licenses": [
        {
            "url": "http://creativecommons.org/licenses/by-nc-sa/2.0/",
            "id": 1,
            "name": "Attribution-NonCommercial-ShareAlike License"
        },
        ……
        ……
    ],
    "images": [
        {
            "license": 4,
            "file_name": "000000397133.jpg", # 圖片名
            "coco_url": "http://images.cocodataset.org/val2017/000000397133.jpg", # coco 鏈接地址
            "height": 427, # 高
            "width": 640, # 寬
            "date_captured": "2013-11-14 17:02:52", # 獲取日期
            "flickr_url": "http://farm7.staticflickr.com/6116/6255196340_da26cf2c9e_z.jpg", # flickr 鏈接地址
            "id": 397133 # 圖片ID（每張圖片ID唯一）
        }
    ],
    "categories": [
        {
            "supercategory": "person", # 主類
            "id": 1,  # class id
            "name": "person", # 子類（具體類別）
            "keypoints": [ # 相比Object Instance多了這個字段
                "nose",
                "left_eye",
                "right_eye",
                "left_ear",
                "right_ear",
                "left_shoulder",
                "right_shoulder",
                "left_elbow",
                "right_elbow",
                "left_wrist",
                "right_wrist",
                "left_hip",
                "right_hip",
                "left_knee",
                "right_knee",
                "left_ankle",
                "right_ankle"
            ],
            "skeleton": [ # 骨架
                [
                    16,14
                ],
                [
                    14,12
                ],
               ……
               ……
                [
                    5,7
                ]
            ]
        }
    ],
    "annotations": [
        {
            "segmentation": [
                [
                    446.71,70.66, # 多邊形(對象mask)第一個點 x，y
                    466.07,72.89,
                    471.28,78.85,
                    473.51,88.52,
                    473.51,98.2,
                   ……
                   ……
                    443.74,69.92
                ]
            ],
            "num_keypoints": 13, # 關鍵點數
            "area": 17376.91885,
            "iscrowd": 0,
            "keypoints": [
                # v=0 表示這個關鍵點沒有標注（這種情況下x=y=v=0）
                # v=1 表示這個關鍵點標注了但是不可見(被遮擋了）
                # v=2 表示這個關鍵點標注了同時也可見
                433,94,2, # x,y,v 
                434,90,2,
                0,0,0,
                443,98,2,
                0,0,0,
                ……
                ……
            ],
            "image_id": 397133, # 對應的圖片ID
            "bbox": [
                388.66,69.92,109.41,277.62 # [x,y,w,h] 對象定位框
            ],
            "category_id": 1, # 類別id
            "id": 200887 # 對象id（每個對象id都是唯一的，即不能出現重復）
        },
        ……
        ……
    ]
}

Image Caption的標注格式

運行腳本one_image_json.py 得到單張圖片的JSON信息。

基本上內容與Object Instance的標注格式一樣，不同的地方在於annotations字段內容不一樣以及沒有categories字段

{
    "info": {
        "description": "COCO 2017 Dataset",
        "url": "http://cocodataset.org",
        "version": "1.0",
        "year": 2017,
        "contributor": "COCO Consortium",
        "date_created": "2017/09/01"
    },
    "licenses": [
        {
            "url": "http://creativecommons.org/licenses/by-nc-sa/2.0/",
            "id": 1,
            "name": "Attribution-NonCommercial-ShareAlike License"
        },
       ……
       ……
    ],
    "images": [
        {
            "license": 4,
            "file_name": "000000397133.jpg",
            "coco_url": "http://images.cocodataset.org/val2017/000000397133.jpg",
            "height": 427,
            "width": 640,
            "date_captured": "2013-11-14 17:02:52",
            "flickr_url": "http://farm7.staticflickr.com/6116/6255196340_da26cf2c9e_z.jpg",
            "id": 397133
        }
    ],
    "annotations": [
        {
            "image_id": 397133, # 圖片ID（唯一）
            "id": 370509, # 對象ID（唯一） （沒有類別ID）
            "caption": "A man is in a kitchen making pizzas." # 圖片描述
        },
    ……
    ……  
        {
            "image_id": 397133,
            "id": 375891,
            "caption": "A table with pies being made and a person standing near a wall with pots and pans hanging on the wall."
        }
    ]
}

這三種標注的info，licenses，images的內容是一樣的。

免責聲明！

本站轉載的文章為個人學習借鑒使用，本站對版權不負任何法律責任。如果侵犯了您的隱私權益，請聯系本站郵箱yoyou2525@163.com刪除。

猜您在找 MS coco中image_caption的數據格式詳解 MS coco數據集下載 MS COCO數據集格式 MS COCO 數據集學習筆記（Common Objects in COntext）自制 COCO api 直接讀取類 COCO 的標注數據的壓縮文件 coco標注信息與labelme標注信息的詳解、相互轉換及可視化將彩色RGB分割標注圖像數據集轉換為COCO格式的JSON文件 coco數據集標注圖轉為二值圖python（附代碼） CrowdHuman數據集標注格式轉換為YOLOv3可以使用的COCO格式 coco數據集標注文件json格式化查看

MS COCO數據標注詳解

JSON文件

打開JSON文件查看數據特點

Object Instance 類型的標注格式

info

licenses

images

categories

annotations

可視化

仿照COCO JSON文件

首先是要labelme做好圖片標注

將labelme的JSON轉成COCO格式JSON

可視化數據

Object Keypoint 類型的標注格式

Image Caption的標注格式

免責聲明！

首先是要`labelme`做好圖片標注