├── VOCdevkit
    └── VOC2007
    │   ├── JPEGImages
    │       ├── 0.jpg
    │       ├── 1.jpg
    │       ├── 2.jpg
    │       ├── 3.jpg
    │       └── 4.jpg
    │   └── Annotations
    │       ├── 0.xml
    │       ├── 2.xml
    │       ├── 3.xml
    │       ├── 1.xml
    │       └── 4.xml
├── VOCdevkit_Origin
    └── VOC2007
    │   ├── JPEGImages
    │       ├── 000001.jpg
    │       ├── 000002.jpg
    │       ├── 000003.jpg
    │       ├── 000004.jpg
    │       └── 000005.jpg
    │   └── Annotations
    │       ├── 000002.xml
    │       ├── 000003.xml
    │       ├── 000001.xml
    │       ├── 000005.xml
    │       └── 000004.xml
├── README.md
├── LICENSE
├── utils
    ├── utils.py
    └── random_data.py
├── test_get_random_data.py
├── test_mosaic.py
├── .gitignore
├── test_mixup.py
├── generate_get_random_data.py
├── generate_mosaic.py
└── generate_mixup.py


/VOCdevkit/VOC2007/JPEGImages/0.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit/VOC2007/JPEGImages/0.jpg


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/JPEGImages/1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit/VOC2007/JPEGImages/1.jpg


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/JPEGImages/2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit/VOC2007/JPEGImages/2.jpg


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/JPEGImages/3.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit/VOC2007/JPEGImages/3.jpg


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/JPEGImages/4.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit/VOC2007/JPEGImages/4.jpg


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/JPEGImages/000001.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit_Origin/VOC2007/JPEGImages/000001.jpg


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/JPEGImages/000002.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit_Origin/VOC2007/JPEGImages/000002.jpg


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/JPEGImages/000003.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit_Origin/VOC2007/JPEGImages/000003.jpg


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/JPEGImages/000004.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit_Origin/VOC2007/JPEGImages/000004.jpg


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/JPEGImages/000005.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/bubbliiiing/object-detection-augmentation/HEAD/VOCdevkit_Origin/VOC2007/JPEGImages/000005.jpg


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | ## object-detection-augmentation-这里面存放了一些目标检测算法的数据增强方法。如mosaic、mixup。
 2 | ---
 3 | 
 4 | ## 目录
 5 | 1. [数据增强测试](#数据增强测试)
 6 | 2. [生成图片与标签](#生成图片与标签)
 7 | 
 8 | ## 数据增强测试
 9 | 以test开头的几个py文件用于测试不同的数据增强方法。
10 | ### 测试步骤
11 | 1、Origin_VOCdevkit_path用于指定VOC数据集所在的文件夹；       
12 | 2、input_shape代表数据增强后的图片的大小；     
13 | 3、运行test_*.py即可查看对应的数据增强效果。     
14 | 
15 | ## 生成图片与标签
16 | 以generate开头的几个py文件用于生成并保存数据增强后的标签与图片。
17 | ### 生成步骤
18 | 1、Origin_VOCdevkit_path用于指定需要增强的数据集路径；     
19 | 2、Out_VOCdevkit_path用于指定输出的数据集路径；     
20 | 3、Out_Num用于指定增强后生成的图片数量；    
21 | 4、input_shape代表数据增强后的图片的大小；       
22 | 5、运行generate_*.py即可生成并保存数据增强后的标签与图片。


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/Annotations/000002.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 | 	<folder>VOC2007</folder>
 3 | 	<filename>000002.jpg</filename>
 4 | 	<source>
 5 | 		<database>The VOC2007 Database</database>
 6 | 		<annotation>PASCAL VOC2007</annotation>
 7 | 		<image>flickr</image>
 8 | 		<flickrid>329145082</flickrid>
 9 | 	</source>
10 | 	<owner>
11 | 		<flickrid>hiromori2</flickrid>
12 | 		<name>Hiroyuki Mori</name>
13 | 	</owner>
14 | 	<size>
15 | 		<width>335</width>
16 | 		<height>500</height>
17 | 		<depth>3</depth>
18 | 	</size>
19 | 	<segmented>0</segmented>
20 | 	<object>
21 | 		<name>train</name>
22 | 		<pose>Unspecified</pose>
23 | 		<truncated>0</truncated>
24 | 		<difficult>0</difficult>
25 | 		<bndbox>
26 | 			<xmin>139</xmin>
27 | 			<ymin>200</ymin>
28 | 			<xmax>207</xmax>
29 | 			<ymax>301</ymax>
30 | 		</bndbox>
31 | 	</object>
32 | </annotation>
33 | 


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/Annotations/0.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 |     <folder>VOC</folder>
 3 |     <filename>VOCdevkit\VOC2007/JPEGImages\0.jpg</filename>
 4 |     <source>
 5 |         <database>My Database</database>
 6 |         <annotation>COCO</annotation>
 7 |         <image>flickr</image>
 8 |         <flickrid>NULL</flickrid>
 9 |     </source>
10 |     <owner>
11 |         <flickrid>NULL</flickrid>
12 |         <name>company</name>
13 |     </owner>
14 |     <size>
15 |         <width>640</width>
16 |         <height>640</height>
17 |         <depth>3</depth>
18 |     </size>
19 |     <segmented>0</segmented>
20 |     <object>
21 |         <name>train</name>
22 |         <pose>Unspecified</pose>
23 |         <truncated>0</truncated>
24 |         <difficult>0</difficult>
25 |         <bndbox>
26 |             <xmin>233</xmin>
27 |             <ymin>194</ymin>
28 |             <xmax>334</xmax>
29 |             <ymax>372</ymax>
30 |         </bndbox>
31 |     </object>
32 | </annotation>
33 | 


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/Annotations/000003.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 | 	<folder>VOC2007</folder>
 3 | 	<filename>000003.jpg</filename>
 4 | 	<source>
 5 | 		<database>The VOC2007 Database</database>
 6 | 		<annotation>PASCAL VOC2007</annotation>
 7 | 		<image>flickr</image>
 8 | 		<flickrid>138563409</flickrid>
 9 | 	</source>
10 | 	<owner>
11 | 		<flickrid>RandomEvent101</flickrid>
12 | 		<name>?</name>
13 | 	</owner>
14 | 	<size>
15 | 		<width>500</width>
16 | 		<height>375</height>
17 | 		<depth>3</depth>
18 | 	</size>
19 | 	<segmented>0</segmented>
20 | 	<object>
21 | 		<name>sofa</name>
22 | 		<pose>Unspecified</pose>
23 | 		<truncated>0</truncated>
24 | 		<difficult>0</difficult>
25 | 		<bndbox>
26 | 			<xmin>123</xmin>
27 | 			<ymin>155</ymin>
28 | 			<xmax>215</xmax>
29 | 			<ymax>195</ymax>
30 | 		</bndbox>
31 | 	</object>
32 | 	<object>
33 | 		<name>chair</name>
34 | 		<pose>Left</pose>
35 | 		<truncated>0</truncated>
36 | 		<difficult>0</difficult>
37 | 		<bndbox>
38 | 			<xmin>239</xmin>
39 | 			<ymin>156</ymin>
40 | 			<xmax>307</xmax>
41 | 			<ymax>205</ymax>
42 | 		</bndbox>
43 | 	</object>
44 | </annotation>
45 | 


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/Annotations/000001.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 | 	<folder>VOC2007</folder>
 3 | 	<filename>000001.jpg</filename>
 4 | 	<source>
 5 | 		<database>The VOC2007 Database</database>
 6 | 		<annotation>PASCAL VOC2007</annotation>
 7 | 		<image>flickr</image>
 8 | 		<flickrid>341012865</flickrid>
 9 | 	</source>
10 | 	<owner>
11 | 		<flickrid>Fried Camels</flickrid>
12 | 		<name>Jinky the Fruit Bat</name>
13 | 	</owner>
14 | 	<size>
15 | 		<width>353</width>
16 | 		<height>500</height>
17 | 		<depth>3</depth>
18 | 	</size>
19 | 	<segmented>0</segmented>
20 | 	<object>
21 | 		<name>dog</name>
22 | 		<pose>Left</pose>
23 | 		<truncated>1</truncated>
24 | 		<difficult>0</difficult>
25 | 		<bndbox>
26 | 			<xmin>48</xmin>
27 | 			<ymin>240</ymin>
28 | 			<xmax>195</xmax>
29 | 			<ymax>371</ymax>
30 | 		</bndbox>
31 | 	</object>
32 | 	<object>
33 | 		<name>person</name>
34 | 		<pose>Left</pose>
35 | 		<truncated>1</truncated>
36 | 		<difficult>0</difficult>
37 | 		<bndbox>
38 | 			<xmin>8</xmin>
39 | 			<ymin>12</ymin>
40 | 			<xmax>352</xmax>
41 | 			<ymax>498</ymax>
42 | 		</bndbox>
43 | 	</object>
44 | </annotation>
45 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2022 Bubbliiiing
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/Annotations/2.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 |     <folder>VOC</folder>
 3 |     <filename>VOCdevkit\VOC2007/JPEGImages\2.jpg</filename>
 4 |     <source>
 5 |         <database>My Database</database>
 6 |         <annotation>COCO</annotation>
 7 |         <image>flickr</image>
 8 |         <flickrid>NULL</flickrid>
 9 |     </source>
10 |     <owner>
11 |         <flickrid>NULL</flickrid>
12 |         <name>company</name>
13 |     </owner>
14 |     <size>
15 |         <width>640</width>
16 |         <height>640</height>
17 |         <depth>3</depth>
18 |     </size>
19 |     <segmented>0</segmented>
20 |     <object>
21 |         <name>chair</name>
22 |         <pose>Unspecified</pose>
23 |         <truncated>0</truncated>
24 |         <difficult>0</difficult>
25 |         <bndbox>
26 |             <xmin>149</xmin>
27 |             <ymin>180</ymin>
28 |             <xmax>307</xmax>
29 |             <ymax>296</ymax>
30 |         </bndbox>
31 |     </object>
32 |     <object>
33 |         <name>sofa</name>
34 |         <pose>Unspecified</pose>
35 |         <truncated>0</truncated>
36 |         <difficult>0</difficult>
37 |         <bndbox>
38 |             <xmin>363</xmin>
39 |             <ymin>178</ymin>
40 |             <xmax>577</xmax>
41 |             <ymax>272</ymax>
42 |         </bndbox>
43 |     </object>
44 | </annotation>
45 | 


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/Annotations/3.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 |     <folder>VOC</folder>
 3 |     <filename>VOCdevkit\VOC2007/JPEGImages\3.jpg</filename>
 4 |     <source>
 5 |         <database>My Database</database>
 6 |         <annotation>COCO</annotation>
 7 |         <image>flickr</image>
 8 |         <flickrid>NULL</flickrid>
 9 |     </source>
10 |     <owner>
11 |         <flickrid>NULL</flickrid>
12 |         <name>company</name>
13 |     </owner>
14 |     <size>
15 |         <width>640</width>
16 |         <height>640</height>
17 |         <depth>3</depth>
18 |     </size>
19 |     <segmented>0</segmented>
20 |     <object>
21 |         <name>dog</name>
22 |         <pose>Unspecified</pose>
23 |         <truncated>0</truncated>
24 |         <difficult>0</difficult>
25 |         <bndbox>
26 |             <xmin>275</xmin>
27 |             <ymin>405</ymin>
28 |             <xmax>395</xmax>
29 |             <ymax>515</ymax>
30 |         </bndbox>
31 |     </object>
32 |     <object>
33 |         <name>person</name>
34 |         <pose>Unspecified</pose>
35 |         <truncated>0</truncated>
36 |         <difficult>0</difficult>
37 |         <bndbox>
38 |             <xmin>146</xmin>
39 |             <ymin>213</ymin>
40 |             <xmax>428</xmax>
41 |             <ymax>622</ymax>
42 |         </bndbox>
43 |     </object>
44 | </annotation>
45 | 


--------------------------------------------------------------------------------
/utils/utils.py:
--------------------------------------------------------------------------------
 1 | import copy
 2 | import os
 3 | import xml.etree.ElementTree as ET
 4 | 
 5 | def get_classes(sample_xmls, Origin_Annotations_path):
 6 |     unique_labels  = []
 7 |     for xml in sample_xmls:
 8 |         in_file = open(os.path.join(Origin_Annotations_path, xml), encoding='utf-8')
 9 |         tree    = ET.parse(in_file)
10 |         root    = tree.getroot()
11 |         
12 |         for obj in root.iter('object'):
13 |             cls     = obj.find('name').text
14 |             if cls not in unique_labels:
15 |                 unique_labels.append(cls)
16 |     return unique_labels
17 | 
def convert_annotation(jpg_path, xml_path, classes):
    """Build one annotation line from a VOC-style XML file.

    The result has the form ``"<jpg_path> x1,y1,x2,y2,cls_id ..."`` with one
    space-separated group per kept object. Objects whose ``<difficult>`` tag
    is ``1`` are skipped; a missing or empty ``<difficult>`` tag is treated
    as not difficult.

    Args:
        jpg_path: Image path string placed at the start of the line.
        xml_path: Path of the XML annotation file to read.
        classes: Sequence of class names; an object's class id is its index
            in this sequence.

    Returns:
        The annotation line as a string. If no object is kept, this is just
        ``jpg_path``.

    Raises:
        ValueError: If an object's class name is not present in ``classes``.
    """
    # Context manager guarantees the handle is closed once parsing is done.
    with open(xml_path, encoding='utf-8') as in_file:
        root = ET.parse(in_file).getroot()

    parts = [jpg_path]
    for obj in root.iter('object'):
        # Read the text of the <difficult> child itself; the tag may be
        # absent or empty, in which case the object is kept.
        difficult_node = obj.find('difficult')
        difficult_text = difficult_node.text if difficult_node is not None else None
        if difficult_text is not None and difficult_text.strip():
            if int(difficult_text) == 1:
                continue

        cls = obj.find('name').text
        cls_id = classes.index(cls)

        xmlbox = obj.find('bndbox')
        # Coordinates may be written as floats; truncate them to integers.
        box = [
            int(float(xmlbox.find(tag).text))
            for tag in ('xmin', 'ymin', 'xmax', 'ymax')
        ]

        parts.append(",".join(str(v) for v in box) + ',' + str(cls_id))
    return " ".join(parts)


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/Annotations/000005.xml:
--------------------------------------------------------------------------------
 1 | <annotation>
 2 | 	<folder>VOC2007</folder>
 3 | 	<filename>000005.jpg</filename>
 4 | 	<source>
 5 | 		<database>The VOC2007 Database</database>
 6 | 		<annotation>PASCAL VOC2007</annotation>
 7 | 		<image>flickr</image>
 8 | 		<flickrid>325991873</flickrid>
 9 | 	</source>
10 | 	<owner>
11 | 		<flickrid>archintent louisville</flickrid>
12 | 		<name>?</name>
13 | 	</owner>
14 | 	<size>
15 | 		<width>500</width>
16 | 		<height>375</height>
17 | 		<depth>3</depth>
18 | 	</size>
19 | 	<segmented>0</segmented>
20 | 	<object>
21 | 		<name>chair</name>
22 | 		<pose>Rear</pose>
23 | 		<truncated>0</truncated>
24 | 		<difficult>0</difficult>
25 | 		<bndbox>
26 | 			<xmin>263</xmin>
27 | 			<ymin>211</ymin>
28 | 			<xmax>324</xmax>
29 | 			<ymax>339</ymax>
30 | 		</bndbox>
31 | 	</object>
32 | 	<object>
33 | 		<name>chair</name>
34 | 		<pose>Unspecified</pose>
35 | 		<truncated>0</truncated>
36 | 		<difficult>0</difficult>
37 | 		<bndbox>
38 | 			<xmin>165</xmin>
39 | 			<ymin>264</ymin>
40 | 			<xmax>253</xmax>
41 | 			<ymax>372</ymax>
42 | 		</bndbox>
43 | 	</object>
44 | 	<object>
45 | 		<name>chair</name>
46 | 		<pose>Unspecified</pose>
47 | 		<truncated>1</truncated>
48 | 		<difficult>1</difficult>
49 | 		<bndbox>
50 | 			<xmin>5</xmin>
51 | 			<ymin>244</ymin>
52 | 			<xmax>67</xmax>
53 | 			<ymax>374</ymax>
54 | 		</bndbox>
55 | 	</object>
56 | 	<object>
57 | 		<name>chair</name>
58 | 		<pose>Unspecified</pose>
59 | 		<truncated>0</truncated>
60 | 		<difficult>0</difficult>
61 | 		<bndbox>
62 | 			<xmin>241</xmin>
63 | 			<ymin>194</ymin>
64 | 			<xmax>295</xmax>
65 | 			<ymax>299</ymax>
66 | 		</bndbox>
67 | 	</object>
68 | 	<object>
69 | 		<name>chair</name>
70 | 		<pose>Unspecified</pose>
71 | 		<truncated>1</truncated>
72 | 		<difficult>1</difficult>
73 | 		<bndbox>
74 | 			<xmin>277</xmin>
75 | 			<ymin>186</ymin>
76 | 			<xmax>312</xmax>
77 | 			<ymax>220</ymax>
78 | 		</bndbox>
79 | 	</object>
80 | </annotation>
81 | 


--------------------------------------------------------------------------------
/test_get_random_data.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | from random import sample
 3 | 
 4 | import numpy as np
 5 | from PIL import Image, ImageDraw
 6 | 
 7 | from utils.random_data import get_random_data, get_random_data_with_MixUp
 8 | from utils.utils import convert_annotation, get_classes
 9 | 
#-----------------------------------------------------------------------------------#
#   Origin_VOCdevkit_path   Path of the original dataset.
#-----------------------------------------------------------------------------------#
Origin_VOCdevkit_path   = "VOCdevkit_Origin"
#-----------------------------------------------------------------------------------#
#   input_shape             Size of the generated image.
#-----------------------------------------------------------------------------------#
input_shape             = [640, 640]

if __name__ == "__main__":
    Origin_JPEGImages_path  = os.path.join(Origin_VOCdevkit_path, "VOC2007/JPEGImages")
    Origin_Annotations_path = os.path.join(Origin_VOCdevkit_path, "VOC2007/Annotations")

    #---------------------------#
    #   List the annotation files. Entries that are not .xml files are
    #   skipped so a stray file cannot be sampled and fail to parse.
    #---------------------------#
    xml_names = [name for name in os.listdir(Origin_Annotations_path) if name.endswith(".xml")]

    #------------------------------#
    #   Pick one image and its annotation
    #------------------------------#
    sample_xmls     = sample(xml_names, 1)
    unique_labels   = get_classes(sample_xmls, Origin_Annotations_path)

    jpg_name        = os.path.join(Origin_JPEGImages_path, os.path.splitext(sample_xmls[0])[0] + '.jpg')
    xml_name        = os.path.join(Origin_Annotations_path, sample_xmls[0])

    line = convert_annotation(jpg_name, xml_name, unique_labels)

    #------------------------------#
    #   Apply the data augmentation
    #------------------------------#
    image_data, box_data  = get_random_data(line, input_shape)

    #------------------------------#
    #   Draw every returned box on the image and display it
    #------------------------------#
    img         = Image.fromarray(image_data.astype(np.uint8))
    draw        = ImageDraw.Draw(img)   # one drawing context is enough for all boxes
    thickness   = 3
    for box in box_data:
        left, top, right, bottom = box[0:4]
        # Nested 1-pixel rectangles give an outline `thickness` pixels wide.
        for i in range(thickness):
            draw.rectangle([left + i, top + i, right - i, bottom - i], outline=(255, 255, 255))
    img.show()
52 | 


--------------------------------------------------------------------------------
/test_mosaic.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | from random import sample
 3 | 
 4 | import numpy as np
 5 | from PIL import Image, ImageDraw
 6 | 
 7 | from utils.random_data import get_random_data, get_random_data_with_Mosaic
 8 | from utils.utils import convert_annotation, get_classes
 9 | 
#-----------------------------------------------------------------------------------#
#   Origin_VOCdevkit_path   Path of the original dataset.
#-----------------------------------------------------------------------------------#
Origin_VOCdevkit_path   = "VOCdevkit_Origin"
#-----------------------------------------------------------------------------------#
#   input_shape             Size of the generated image.
#-----------------------------------------------------------------------------------#
input_shape             = [640, 640]

if __name__ == "__main__":
    Origin_JPEGImages_path  = os.path.join(Origin_VOCdevkit_path, "VOC2007/JPEGImages")
    Origin_Annotations_path = os.path.join(Origin_VOCdevkit_path, "VOC2007/Annotations")

    #---------------------------#
    #   List the annotation files. Entries that are not .xml files are
    #   skipped so a stray file cannot be sampled and fail to parse.
    #---------------------------#
    xml_names = [name for name in os.listdir(Origin_Annotations_path) if name.endswith(".xml")]

    #------------------------------#
    #   Pick 4 images and their annotations
    #------------------------------#
    sample_xmls     = sample(xml_names, 4)
    unique_labels   = get_classes(sample_xmls, Origin_Annotations_path)

    annotation_line = [
        convert_annotation(
            os.path.join(Origin_JPEGImages_path, os.path.splitext(xml)[0] + '.jpg'),
            os.path.join(Origin_Annotations_path, xml),
            unique_labels,
        )
        for xml in sample_xmls
    ]

    #------------------------------#
    #   Combine them with mosaic
    #------------------------------#
    image_data, box_data = get_random_data_with_Mosaic(annotation_line, input_shape)

    #------------------------------#
    #   Draw every returned box on the image and display it
    #------------------------------#
    img         = Image.fromarray(image_data.astype(np.uint8))
    draw        = ImageDraw.Draw(img)   # one drawing context is enough for all boxes
    thickness   = 3
    for box in box_data:
        left, top, right, bottom = box[0:4]
        # Nested 1-pixel rectangles give an outline `thickness` pixels wide.
        for i in range(thickness):
            draw.rectangle([left + i, top + i, right - i, bottom - i], outline=(255, 255, 255))
    img.show()
52 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
  1 | *.jpg
  2 | *.xml
  3 | 
  4 | # Byte-compiled / optimized / DLL files
  5 | __pycache__/
  6 | *.py[cod]
  7 | *$py.class
  8 | 
  9 | # C extensions
 10 | *.so
 11 | 
 12 | # Distribution / packaging
 13 | .Python
 14 | build/
 15 | develop-eggs/
 16 | dist/
 17 | downloads/
 18 | eggs/
 19 | .eggs/
 20 | lib/
 21 | lib64/
 22 | parts/
 23 | sdist/
 24 | var/
 25 | wheels/
 26 | pip-wheel-metadata/
 27 | share/python-wheels/
 28 | *.egg-info/
 29 | .installed.cfg
 30 | *.egg
 31 | MANIFEST
 32 | 
 33 | # PyInstaller
 34 | #  Usually these files are written by a python script from a template
 35 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 36 | *.manifest
 37 | *.spec
 38 | 
 39 | # Installer logs
 40 | pip-log.txt
 41 | pip-delete-this-directory.txt
 42 | 
 43 | # Unit test / coverage reports
 44 | htmlcov/
 45 | .tox/
 46 | .nox/
 47 | .coverage
 48 | .coverage.*
 49 | .cache
 50 | nosetests.xml
 51 | coverage.xml
 52 | *.cover
 53 | *.py,cover
 54 | .hypothesis/
 55 | .pytest_cache/
 56 | 
 57 | # Translations
 58 | *.mo
 59 | *.pot
 60 | 
 61 | # Django stuff:
 62 | *.log
 63 | local_settings.py
 64 | db.sqlite3
 65 | db.sqlite3-journal
 66 | 
 67 | # Flask stuff:
 68 | instance/
 69 | .webassets-cache
 70 | 
 71 | # Scrapy stuff:
 72 | .scrapy
 73 | 
 74 | # Sphinx documentation
 75 | docs/_build/
 76 | 
 77 | # PyBuilder
 78 | target/
 79 | 
 80 | # Jupyter Notebook
 81 | .ipynb_checkpoints
 82 | 
 83 | # IPython
 84 | profile_default/
 85 | ipython_config.py
 86 | 
 87 | # pyenv
 88 | .python-version
 89 | 
 90 | # pipenv
 91 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 92 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 93 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
 94 | #   install all needed dependencies.
 95 | #Pipfile.lock
 96 | 
 97 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow
 98 | __pypackages__/
 99 | 
100 | # Celery stuff
101 | celerybeat-schedule
102 | celerybeat.pid
103 | 
104 | # SageMath parsed files
105 | *.sage.py
106 | 
107 | # Environments
108 | .env
109 | .venv
110 | env/
111 | venv/
112 | ENV/
113 | env.bak/
114 | venv.bak/
115 | 
116 | # Spyder project settings
117 | .spyderproject
118 | .spyproject
119 | 
120 | # Rope project settings
121 | .ropeproject
122 | 
123 | # mkdocs documentation
124 | /site
125 | 
126 | # mypy
127 | .mypy_cache/
128 | .dmypy.json
129 | dmypy.json
130 | 
131 | # Pyre type checker
132 | .pyre/
133 | 


--------------------------------------------------------------------------------
/VOCdevkit_Origin/VOC2007/Annotations/000004.xml:
--------------------------------------------------------------------------------
  1 | <annotation>
  2 | 	<folder>VOC2007</folder>
  3 | 	<filename>000004.jpg</filename>
  4 | 	<source>
  5 | 		<database>The VOC2007 Database</database>
  6 | 		<annotation>PASCAL VOC2007</annotation>
  7 | 		<image>flickr</image>
  8 | 		<flickrid>322032655</flickrid>
  9 | 	</source>
 10 | 	<owner>
 11 | 		<flickrid>paytonc</flickrid>
 12 | 		<name>Payton Chung</name>
 13 | 	</owner>
 14 | 	<size>
 15 | 		<width>500</width>
 16 | 		<height>406</height>
 17 | 		<depth>3</depth>
 18 | 	</size>
 19 | 	<segmented>0</segmented>
 20 | 	<object>
 21 | 		<name>car</name>
 22 | 		<pose>Frontal</pose>
 23 | 		<truncated>0</truncated>
 24 | 		<difficult>0</difficult>
 25 | 		<bndbox>
 26 | 			<xmin>13</xmin>
 27 | 			<ymin>311</ymin>
 28 | 			<xmax>84</xmax>
 29 | 			<ymax>362</ymax>
 30 | 		</bndbox>
 31 | 	</object>
 32 | 	<object>
 33 | 		<name>car</name>
 34 | 		<pose>Unspecified</pose>
 35 | 		<truncated>1</truncated>
 36 | 		<difficult>0</difficult>
 37 | 		<bndbox>
 38 | 			<xmin>362</xmin>
 39 | 			<ymin>330</ymin>
 40 | 			<xmax>500</xmax>
 41 | 			<ymax>389</ymax>
 42 | 		</bndbox>
 43 | 	</object>
 44 | 	<object>
 45 | 		<name>car</name>
 46 | 		<pose>Unspecified</pose>
 47 | 		<truncated>0</truncated>
 48 | 		<difficult>0</difficult>
 49 | 		<bndbox>
 50 | 			<xmin>235</xmin>
 51 | 			<ymin>328</ymin>
 52 | 			<xmax>334</xmax>
 53 | 			<ymax>375</ymax>
 54 | 		</bndbox>
 55 | 	</object>
 56 | 	<object>
 57 | 		<name>car</name>
 58 | 		<pose>Unspecified</pose>
 59 | 		<truncated>0</truncated>
 60 | 		<difficult>0</difficult>
 61 | 		<bndbox>
 62 | 			<xmin>175</xmin>
 63 | 			<ymin>327</ymin>
 64 | 			<xmax>252</xmax>
 65 | 			<ymax>364</ymax>
 66 | 		</bndbox>
 67 | 	</object>
 68 | 	<object>
 69 | 		<name>car</name>
 70 | 		<pose>Unspecified</pose>
 71 | 		<truncated>0</truncated>
 72 | 		<difficult>0</difficult>
 73 | 		<bndbox>
 74 | 			<xmin>139</xmin>
 75 | 			<ymin>320</ymin>
 76 | 			<xmax>189</xmax>
 77 | 			<ymax>359</ymax>
 78 | 		</bndbox>
 79 | 	</object>
 80 | 	<object>
 81 | 		<name>car</name>
 82 | 		<pose>Unspecified</pose>
 83 | 		<truncated>0</truncated>
 84 | 		<difficult>0</difficult>
 85 | 		<bndbox>
 86 | 			<xmin>108</xmin>
 87 | 			<ymin>325</ymin>
 88 | 			<xmax>150</xmax>
 89 | 			<ymax>353</ymax>
 90 | 		</bndbox>
 91 | 	</object>
 92 | 	<object>
 93 | 		<name>car</name>
 94 | 		<pose>Unspecified</pose>
 95 | 		<truncated>0</truncated>
 96 | 		<difficult>0</difficult>
 97 | 		<bndbox>
 98 | 			<xmin>84</xmin>
 99 | 			<ymin>323</ymin>
100 | 			<xmax>121</xmax>
101 | 			<ymax>350</ymax>
102 | 		</bndbox>
103 | 	</object>
104 | </annotation>
105 | 


--------------------------------------------------------------------------------
/test_mixup.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | from random import sample
 3 | 
 4 | import numpy as np
 5 | from PIL import Image, ImageDraw
 6 | 
 7 | from utils.random_data import get_random_data, get_random_data_with_MixUp
 8 | from utils.utils import convert_annotation, get_classes
 9 | 
#-----------------------------------------------------------------------------------#
#   Origin_VOCdevkit_path   Path of the original dataset.
#-----------------------------------------------------------------------------------#
Origin_VOCdevkit_path   = "VOCdevkit_Origin"
#-----------------------------------------------------------------------------------#
#   input_shape             Size of the generated image.
#-----------------------------------------------------------------------------------#
input_shape             = [640, 640]

if __name__ == "__main__":
    Origin_JPEGImages_path  = os.path.join(Origin_VOCdevkit_path, "VOC2007/JPEGImages")
    Origin_Annotations_path = os.path.join(Origin_VOCdevkit_path, "VOC2007/Annotations")

    #---------------------------#
    #   List the annotation files. Entries that are not .xml files are
    #   skipped so a stray file cannot be sampled and fail to parse.
    #---------------------------#
    xml_names = [name for name in os.listdir(Origin_Annotations_path) if name.endswith(".xml")]

    #------------------------------#
    #   Pick two images and their annotations
    #------------------------------#
    sample_xmls     = sample(xml_names, 2)
    unique_labels   = get_classes(sample_xmls, Origin_Annotations_path)
    jpg_name_1  = os.path.join(Origin_JPEGImages_path, os.path.splitext(sample_xmls[0])[0] + '.jpg')
    jpg_name_2  = os.path.join(Origin_JPEGImages_path, os.path.splitext(sample_xmls[1])[0] + '.jpg')
    xml_name_1  = os.path.join(Origin_Annotations_path, sample_xmls[0])
    xml_name_2  = os.path.join(Origin_Annotations_path, sample_xmls[1])

    line_1 = convert_annotation(jpg_name_1, xml_name_1, unique_labels)
    line_2 = convert_annotation(jpg_name_2, xml_name_2, unique_labels)

    #------------------------------#
    #   Augment each sample separately
    #------------------------------#
    image_1, box_1  = get_random_data(line_1, input_shape)
    image_2, box_2  = get_random_data(line_2, input_shape)

    #------------------------------#
    #   Combine them with mixup
    #------------------------------#
    image_data, box_data = get_random_data_with_MixUp(image_1, box_1, image_2, box_2)

    #------------------------------#
    #   Draw every returned box on the image and display it
    #------------------------------#
    img         = Image.fromarray(image_data.astype(np.uint8))
    draw        = ImageDraw.Draw(img)   # one drawing context is enough for all boxes
    thickness   = 3
    for box in box_data:
        left, top, right, bottom = box[0:4]
        # Nested 1-pixel rectangles give an outline `thickness` pixels wide.
        for i in range(thickness):
            draw.rectangle([left + i, top + i, right - i, bottom - i], outline=(255, 255, 255))
    img.show()
60 | 


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/Annotations/1.xml:
--------------------------------------------------------------------------------
  1 | <annotation>
  2 |     <folder>VOC</folder>
  3 |     <filename>VOCdevkit\VOC2007/JPEGImages\1.jpg</filename>
  4 |     <source>
  5 |         <database>My Database</database>
  6 |         <annotation>COCO</annotation>
  7 |         <image>flickr</image>
  8 |         <flickrid>NULL</flickrid>
  9 |     </source>
 10 |     <owner>
 11 |         <flickrid>NULL</flickrid>
 12 |         <name>company</name>
 13 |     </owner>
 14 |     <size>
 15 |         <width>640</width>
 16 |         <height>640</height>
 17 |         <depth>3</depth>
 18 |     </size>
 19 |     <segmented>0</segmented>
 20 |     <object>
 21 |         <name>car</name>
 22 |         <pose>Unspecified</pose>
 23 |         <truncated>0</truncated>
 24 |         <difficult>0</difficult>
 25 |         <bndbox>
 26 |             <xmin>12</xmin>
 27 |             <ymin>513</ymin>
 28 |             <xmax>181</xmax>
 29 |             <ymax>595</ymax>
 30 |         </bndbox>
 31 |     </object>
 32 |     <object>
 33 |         <name>car</name>
 34 |         <pose>Unspecified</pose>
 35 |         <truncated>0</truncated>
 36 |         <difficult>0</difficult>
 37 |         <bndbox>
 38 |             <xmin>476</xmin>
 39 |             <ymin>503</ymin>
 40 |             <xmax>521</xmax>
 41 |             <ymax>541</ymax>
 42 |         </bndbox>
 43 |     </object>
 44 |     <object>
 45 |         <name>car</name>
 46 |         <pose>Unspecified</pose>
 47 |         <truncated>0</truncated>
 48 |         <difficult>0</difficult>
 49 |         <bndbox>
 50 |             <xmin>440</xmin>
 51 |             <ymin>506</ymin>
 52 |             <xmax>492</xmax>
 53 |             <ymax>545</ymax>
 54 |         </bndbox>
 55 |     </object>
 56 |     <object>
 57 |         <name>car</name>
 58 |         <pose>Unspecified</pose>
 59 |         <truncated>0</truncated>
 60 |         <difficult>0</difficult>
 61 |         <bndbox>
 62 |             <xmin>215</xmin>
 63 |             <ymin>510</ymin>
 64 |             <xmax>336</xmax>
 65 |             <ymax>575</ymax>
 66 |         </bndbox>
 67 |     </object>
 68 |     <object>
 69 |         <name>car</name>
 70 |         <pose>Unspecified</pose>
 71 |         <truncated>0</truncated>
 72 |         <difficult>0</difficult>
 73 |         <bndbox>
 74 |             <xmin>393</xmin>
 75 |             <ymin>499</ymin>
 76 |             <xmax>454</xmax>
 77 |             <ymax>553</ymax>
 78 |         </bndbox>
 79 |     </object>
 80 |     <object>
 81 |         <name>car</name>
 82 |         <pose>Unspecified</pose>
 83 |         <truncated>0</truncated>
 84 |         <difficult>0</difficult>
 85 |         <bndbox>
 86 |             <xmin>521</xmin>
 87 |             <ymin>487</ymin>
 88 |             <xmax>608</xmax>
 89 |             <ymax>557</ymax>
 90 |         </bndbox>
 91 |     </object>
 92 |     <object>
 93 |         <name>car</name>
 94 |         <pose>Unspecified</pose>
 95 |         <truncated>0</truncated>
 96 |         <difficult>0</difficult>
 97 |         <bndbox>
 98 |             <xmin>316</xmin>
 99 |             <ymin>509</ymin>
100 |             <xmax>410</xmax>
101 |             <ymax>560</ymax>
102 |         </bndbox>
103 |     </object>
104 | </annotation>
105 | 


--------------------------------------------------------------------------------
/VOCdevkit/VOC2007/Annotations/4.xml:
--------------------------------------------------------------------------------
  1 | <annotation>
  2 |     <folder>VOC</folder>
  3 |     <filename>VOCdevkit\VOC2007/JPEGImages\4.jpg</filename>
  4 |     <source>
  5 |         <database>My Database</database>
  6 |         <annotation>COCO</annotation>
  7 |         <image>flickr</image>
  8 |         <flickrid>NULL</flickrid>
  9 |     </source>
 10 |     <owner>
 11 |         <flickrid>NULL</flickrid>
 12 |         <name>company</name>
 13 |     </owner>
 14 |     <size>
 15 |         <width>640</width>
 16 |         <height>640</height>
 17 |         <depth>3</depth>
 18 |     </size>
 19 |     <segmented>0</segmented>
 20 |     <object>
 21 |         <name>car</name>
 22 |         <pose>Unspecified</pose>
 23 |         <truncated>0</truncated>
 24 |         <difficult>0</difficult>
 25 |         <bndbox>
 26 |             <xmin>123</xmin>
 27 |             <ymin>285</ymin>
 28 |             <xmax>135</xmax>
 29 |             <ymax>297</ymax>
 30 |         </bndbox>
 31 |     </object>
 32 |     <object>
 33 |         <name>car</name>
 34 |         <pose>Unspecified</pose>
 35 |         <truncated>0</truncated>
 36 |         <difficult>0</difficult>
 37 |         <bndbox>
 38 |             <xmin>141</xmin>
 39 |             <ymin>284</ymin>
 40 |             <xmax>158</xmax>
 41 |             <ymax>301</ymax>
 42 |         </bndbox>
 43 |     </object>
 44 |     <object>
 45 |         <name>car</name>
 46 |         <pose>Unspecified</pose>
 47 |         <truncated>0</truncated>
 48 |         <difficult>0</difficult>
 49 |         <bndbox>
 50 |             <xmin>131</xmin>
 51 |             <ymin>286</ymin>
 52 |             <xmax>145</xmax>
 53 |             <ymax>298</ymax>
 54 |         </bndbox>
 55 |     </object>
 56 |     <object>
 57 |         <name>car</name>
 58 |         <pose>Unspecified</pose>
 59 |         <truncated>0</truncated>
 60 |         <difficult>0</difficult>
 61 |         <bndbox>
 62 |             <xmin>173</xmin>
 63 |             <ymin>287</ymin>
 64 |             <xmax>206</xmax>
 65 |             <ymax>307</ymax>
 66 |         </bndbox>
 67 |     </object>
 68 |     <object>
 69 |         <name>car</name>
 70 |         <pose>Unspecified</pose>
 71 |         <truncated>0</truncated>
 72 |         <difficult>0</difficult>
 73 |         <bndbox>
 74 |             <xmin>215</xmin>
 75 |             <ymin>288</ymin>
 76 |             <xmax>262</xmax>
 77 |             <ymax>313</ymax>
 78 |         </bndbox>
 79 |     </object>
 80 |     <object>
 81 |         <name>car</name>
 82 |         <pose>Unspecified</pose>
 83 |         <truncated>0</truncated>
 84 |         <difficult>0</difficult>
 85 |         <bndbox>
 86 |             <xmin>99</xmin>
 87 |             <ymin>280</ymin>
 88 |             <xmax>123</xmax>
 89 |             <ymax>302</ymax>
 90 |         </bndbox>
 91 |     </object>
 92 |     <object>
 93 |         <name>car</name>
 94 |         <pose>Unspecified</pose>
 95 |         <truncated>0</truncated>
 96 |         <difficult>0</difficult>
 97 |         <bndbox>
 98 |             <xmin>153</xmin>
 99 |             <ymin>287</ymin>
100 |             <xmax>179</xmax>
101 |             <ymax>303</ymax>
102 |         </bndbox>
103 |     </object>
104 | </annotation>
105 | 


--------------------------------------------------------------------------------
/generate_get_random_data.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | from random import sample
  3 | 
  4 | import numpy as np
  5 | from PIL import Image, ImageDraw
  6 | 
  7 | from utils.random_data import get_random_data, get_random_data_with_MixUp
  8 | from utils.utils import convert_annotation, get_classes
  9 | 
#-----------------------------------------------------------------------------------#
#   Origin_VOCdevkit_path   Directory of the original (source) dataset
#   Out_VOCdevkit_path      Directory the generated dataset is written to
#-----------------------------------------------------------------------------------#
Origin_VOCdevkit_path   = "VOCdevkit_Origin"
Out_VOCdevkit_path      = "VOCdevkit"
#-----------------------------------------------------------------------------------#
#   Out_Num                 Number of image/annotation pairs to generate
#   input_shape             Size of the generated images; get_random_data unpacks
#                           it as (height, width)
#-----------------------------------------------------------------------------------#
Out_Num                 = 5
input_shape             = [640, 640]
 22 | 
 23 | #-----------------------------------------------------------------------------------#
 24 | #   下面定义了xml里面的组成模块，无需改动。
 25 | #-----------------------------------------------------------------------------------#
 26 | headstr = """\
 27 | <annotation>
 28 |     <folder>VOC</folder>
 29 |     <filename>%s</filename>
 30 |     <source>
 31 |         <database>My Database</database>
 32 |         <annotation>COCO</annotation>
 33 |         <image>flickr</image>
 34 |         <flickrid>NULL</flickrid>
 35 |     </source>
 36 |     <owner>
 37 |         <flickrid>NULL</flickrid>
 38 |         <name>company</name>
 39 |     </owner>
 40 |     <size>
 41 |         <width>%d</width>
 42 |         <height>%d</height>
 43 |         <depth>%d</depth>
 44 |     </size>
 45 |     <segmented>0</segmented>
 46 | """
 47 | 
 48 | objstr = """\
 49 |     <object>
 50 |         <name>%s</name>
 51 |         <pose>Unspecified</pose>
 52 |         <truncated>0</truncated>
 53 |         <difficult>0</difficult>
 54 |         <bndbox>
 55 |             <xmin>%d</xmin>
 56 |             <ymin>%d</ymin>
 57 |             <xmax>%d</xmax>
 58 |             <ymax>%d</ymax>
 59 |         </bndbox>
 60 |     </object>
 61 | """
 62 |     
 63 | tailstr = '''\
 64 | </annotation>
 65 | '''
 66 | if __name__ == "__main__":
 67 |     Origin_JPEGImages_path  = os.path.join(Origin_VOCdevkit_path, "VOC2007/JPEGImages")
 68 |     Origin_Annotations_path = os.path.join(Origin_VOCdevkit_path, "VOC2007/Annotations")
 69 |     
 70 |     Out_JPEGImages_path  = os.path.join(Out_VOCdevkit_path, "VOC2007/JPEGImages")
 71 |     Out_Annotations_path = os.path.join(Out_VOCdevkit_path, "VOC2007/Annotations")
 72 |     
 73 |     if not os.path.exists(Out_JPEGImages_path):
 74 |         os.makedirs(Out_JPEGImages_path)
 75 |     if not os.path.exists(Out_Annotations_path):
 76 |         os.makedirs(Out_Annotations_path)
 77 |     #---------------------------#
 78 |     #   遍历标签并赋值
 79 |     #---------------------------#
 80 |     xml_names = os.listdir(Origin_Annotations_path)
 81 | 
 82 |     def write_xml(anno_path, jpg_pth, head, input_shape, boxes, unique_labels, tail):
 83 |         f = open(anno_path, "w")
 84 |         f.write(head%(jpg_pth, input_shape[0], input_shape[1], 3))
 85 |         for i, box in enumerate(boxes):
 86 |             f.write(objstr%(str(unique_labels[int(box[4])]), box[0], box[1], box[2], box[3]))
 87 |         f.write(tail)
 88 |     
 89 |     #------------------------------#
 90 |     #   循环生成xml和jpg
 91 |     #------------------------------#
 92 |     for index in range(Out_Num):
 93 |         #------------------------------#
 94 |         #   获取一个图像与标签
 95 |         #------------------------------#
 96 |         sample_xmls     = sample(xml_names, 1)
 97 |         unique_labels   = get_classes(sample_xmls, Origin_Annotations_path)
 98 |         
 99 |         jpg_name  = os.path.join(Origin_JPEGImages_path, os.path.splitext(sample_xmls[0])[0] + '.jpg')
100 |         xml_name  = os.path.join(Origin_Annotations_path, sample_xmls[0])
101 |             
102 |         line = convert_annotation(jpg_name, xml_name, unique_labels)
103 |         
104 |         #------------------------------#
105 |         #   各自数据增强
106 |         #------------------------------#
107 |         image_data, box_data  = get_random_data(line, input_shape) 
108 |         
109 |         img = Image.fromarray(image_data.astype(np.uint8))
110 |         img.save(os.path.join(Out_JPEGImages_path, str(index) + '.jpg'))
111 |         write_xml(os.path.join(Out_Annotations_path, str(index) + '.xml'), os.path.join(Out_JPEGImages_path, str(index) + '.jpg'), \
112 |                     headstr, input_shape, box_data, unique_labels, tailstr)
113 | 


--------------------------------------------------------------------------------
/generate_mosaic.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | from random import sample
  3 | 
  4 | import numpy as np
  5 | from PIL import Image, ImageDraw
  6 | 
  7 | from utils.random_data import get_random_data, get_random_data_with_Mosaic
  8 | from utils.utils import convert_annotation, get_classes
  9 | 
#-----------------------------------------------------------------------------------#
#   Origin_VOCdevkit_path   Directory of the original (source) dataset
#   Out_VOCdevkit_path      Directory the generated dataset is written to
#-----------------------------------------------------------------------------------#
Origin_VOCdevkit_path   = "VOCdevkit_Origin"
Out_VOCdevkit_path      = "VOCdevkit"
#-----------------------------------------------------------------------------------#
#   Out_Num                 Number of mosaic image/annotation pairs to generate
#   input_shape             Size of the generated images; the mosaic routine
#                           unpacks it as (height, width)
#-----------------------------------------------------------------------------------#
Out_Num                 = 5
input_shape             = [640, 640]
 22 | 
 23 | #-----------------------------------------------------------------------------------#
 24 | #   下面定义了xml里面的组成模块，无需改动。
 25 | #-----------------------------------------------------------------------------------#
 26 | headstr = """\
 27 | <annotation>
 28 |     <folder>VOC</folder>
 29 |     <filename>%s</filename>
 30 |     <source>
 31 |         <database>My Database</database>
 32 |         <annotation>COCO</annotation>
 33 |         <image>flickr</image>
 34 |         <flickrid>NULL</flickrid>
 35 |     </source>
 36 |     <owner>
 37 |         <flickrid>NULL</flickrid>
 38 |         <name>company</name>
 39 |     </owner>
 40 |     <size>
 41 |         <width>%d</width>
 42 |         <height>%d</height>
 43 |         <depth>%d</depth>
 44 |     </size>
 45 |     <segmented>0</segmented>
 46 | """
 47 | 
 48 | objstr = """\
 49 |     <object>
 50 |         <name>%s</name>
 51 |         <pose>Unspecified</pose>
 52 |         <truncated>0</truncated>
 53 |         <difficult>0</difficult>
 54 |         <bndbox>
 55 |             <xmin>%d</xmin>
 56 |             <ymin>%d</ymin>
 57 |             <xmax>%d</xmax>
 58 |             <ymax>%d</ymax>
 59 |         </bndbox>
 60 |     </object>
 61 | """
 62 |     
 63 | tailstr = '''\
 64 | </annotation>
 65 | '''
 66 | if __name__ == "__main__":
 67 |     Origin_JPEGImages_path  = os.path.join(Origin_VOCdevkit_path, "VOC2007/JPEGImages")
 68 |     Origin_Annotations_path = os.path.join(Origin_VOCdevkit_path, "VOC2007/Annotations")
 69 |     
 70 |     Out_JPEGImages_path  = os.path.join(Out_VOCdevkit_path, "VOC2007/JPEGImages")
 71 |     Out_Annotations_path = os.path.join(Out_VOCdevkit_path, "VOC2007/Annotations")
 72 |     
 73 |     if not os.path.exists(Out_JPEGImages_path):
 74 |         os.makedirs(Out_JPEGImages_path)
 75 |     if not os.path.exists(Out_Annotations_path):
 76 |         os.makedirs(Out_Annotations_path)
 77 |     #---------------------------#
 78 |     #   遍历标签并赋值
 79 |     #---------------------------#
 80 |     xml_names = os.listdir(Origin_Annotations_path)
 81 | 
 82 |     def write_xml(anno_path, jpg_pth, head, input_shape, boxes, unique_labels, tail):
 83 |         f = open(anno_path, "w")
 84 |         f.write(head%(jpg_pth, input_shape[0], input_shape[1], 3))
 85 |         for i, box in enumerate(boxes):
 86 |             f.write(objstr%(str(unique_labels[int(box[4])]), box[0], box[1], box[2], box[3]))
 87 |         f.write(tail)
 88 |     
 89 |     #------------------------------#
 90 |     #   循环生成xml和jpg
 91 |     #------------------------------#
 92 |     for index in range(Out_Num):
 93 |         #------------------------------#
 94 |         #   获取4个图像与标签
 95 |         #------------------------------#
 96 |         sample_xmls     = sample(xml_names, 4)
 97 |         unique_labels   = get_classes(sample_xmls, Origin_Annotations_path)
 98 | 
 99 |         annotation_line = []
100 |         for xml in sample_xmls:
101 |             line = convert_annotation(os.path.join(Origin_JPEGImages_path, os.path.splitext(xml)[0] + '.jpg'), os.path.join(Origin_Annotations_path, xml), unique_labels)
102 |             annotation_line.append(line)
103 | 
104 |         #------------------------------#
105 |         #   合并mosaic
106 |         #------------------------------#
107 |         image_data, box_data = get_random_data_with_Mosaic(annotation_line, input_shape)
108 |         
109 |         img = Image.fromarray(image_data.astype(np.uint8))
110 |         img.save(os.path.join(Out_JPEGImages_path, str(index) + '.jpg'))
111 |         write_xml(os.path.join(Out_Annotations_path, str(index) + '.xml'), os.path.join(Out_JPEGImages_path, str(index) + '.jpg'), \
112 |                     headstr, input_shape, box_data, unique_labels, tailstr)
113 | 


--------------------------------------------------------------------------------
/generate_mixup.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | from random import sample
  3 | 
  4 | import numpy as np
  5 | from PIL import Image, ImageDraw
  6 | 
  7 | from utils.random_data import get_random_data, get_random_data_with_MixUp
  8 | from utils.utils import convert_annotation, get_classes
  9 | 
#-----------------------------------------------------------------------------------#
#   Origin_VOCdevkit_path   Directory of the original (source) dataset
#   Out_VOCdevkit_path      Directory the generated dataset is written to
#-----------------------------------------------------------------------------------#
Origin_VOCdevkit_path   = "VOCdevkit_Origin"
Out_VOCdevkit_path      = "VOCdevkit"
#-----------------------------------------------------------------------------------#
#   Out_Num                 Number of mixup image/annotation pairs to generate
#   input_shape             Size of the generated images; get_random_data unpacks
#                           it as (height, width)
#-----------------------------------------------------------------------------------#
Out_Num                 = 100
input_shape             = [640, 640]
 22 | 
 23 | #-----------------------------------------------------------------------------------#
 24 | #   下面定义了xml里面的组成模块，无需改动。
 25 | #-----------------------------------------------------------------------------------#
 26 | headstr = """\
 27 | <annotation>
 28 |     <folder>VOC</folder>
 29 |     <filename>%s</filename>
 30 |     <source>
 31 |         <database>My Database</database>
 32 |         <annotation>COCO</annotation>
 33 |         <image>flickr</image>
 34 |         <flickrid>NULL</flickrid>
 35 |     </source>
 36 |     <owner>
 37 |         <flickrid>NULL</flickrid>
 38 |         <name>company</name>
 39 |     </owner>
 40 |     <size>
 41 |         <width>%d</width>
 42 |         <height>%d</height>
 43 |         <depth>%d</depth>
 44 |     </size>
 45 |     <segmented>0</segmented>
 46 | """
 47 | 
 48 | objstr = """\
 49 |     <object>
 50 |         <name>%s</name>
 51 |         <pose>Unspecified</pose>
 52 |         <truncated>0</truncated>
 53 |         <difficult>0</difficult>
 54 |         <bndbox>
 55 |             <xmin>%d</xmin>
 56 |             <ymin>%d</ymin>
 57 |             <xmax>%d</xmax>
 58 |             <ymax>%d</ymax>
 59 |         </bndbox>
 60 |     </object>
 61 | """
 62 |     
 63 | tailstr = '''\
 64 | </annotation>
 65 | '''
 66 | if __name__ == "__main__":
 67 |     Origin_JPEGImages_path  = os.path.join(Origin_VOCdevkit_path, "VOC2007/JPEGImages")
 68 |     Origin_Annotations_path = os.path.join(Origin_VOCdevkit_path, "VOC2007/Annotations")
 69 |     
 70 |     Out_JPEGImages_path  = os.path.join(Out_VOCdevkit_path, "VOC2007/JPEGImages")
 71 |     Out_Annotations_path = os.path.join(Out_VOCdevkit_path, "VOC2007/Annotations")
 72 |     
 73 |     if not os.path.exists(Out_JPEGImages_path):
 74 |         os.makedirs(Out_JPEGImages_path)
 75 |     if not os.path.exists(Out_Annotations_path):
 76 |         os.makedirs(Out_Annotations_path)
 77 |     #---------------------------#
 78 |     #   遍历标签并赋值
 79 |     #---------------------------#
 80 |     xml_names = os.listdir(Origin_Annotations_path)
 81 | 
 82 |     def write_xml(anno_path, jpg_pth, head, input_shape, boxes, unique_labels, tail):
 83 |         f = open(anno_path, "w")
 84 |         f.write(head%(jpg_pth, input_shape[0], input_shape[1], 3))
 85 |         for i, box in enumerate(boxes):
 86 |             f.write(objstr%(str(unique_labels[int(box[4])]), box[0], box[1], box[2], box[3]))
 87 |         f.write(tail)
 88 |     
 89 |     #------------------------------#
 90 |     #   循环生成xml和jpg
 91 |     #------------------------------#
 92 |     for index in range(Out_Num):
 93 |         #------------------------------#
 94 |         #   获取两个图像与标签
 95 |         #------------------------------#
 96 |         sample_xmls = sample(xml_names, 2)
 97 |         unique_labels = get_classes(sample_xmls, Origin_Annotations_path)
 98 | 
 99 |         jpg_name_1  = os.path.join(Origin_JPEGImages_path, os.path.splitext(sample_xmls[0])[0] + '.jpg')
100 |         jpg_name_2  = os.path.join(Origin_JPEGImages_path, os.path.splitext(sample_xmls[1])[0] + '.jpg')
101 |         xml_name_1  = os.path.join(Origin_Annotations_path, sample_xmls[0])
102 |         xml_name_2  = os.path.join(Origin_Annotations_path, sample_xmls[1])
103 |             
104 |         line_1 = convert_annotation(jpg_name_1, xml_name_1, unique_labels)
105 |         line_2 = convert_annotation(jpg_name_2, xml_name_2, unique_labels)
106 |         
107 |         #------------------------------#
108 |         #   各自数据增强
109 |         #------------------------------#
110 |         image_1, box_1  = get_random_data(line_1, input_shape) 
111 |         image_2, box_2  = get_random_data(line_2, input_shape) 
112 |         
113 |         #------------------------------#
114 |         #   合并mixup
115 |         #------------------------------#
116 |         image_data, box_data = get_random_data_with_MixUp(image_1, box_1, image_2, box_2)
117 |         
118 |         img = Image.fromarray(image_data.astype(np.uint8))
119 |         img.save(os.path.join(Out_JPEGImages_path, str(index) + '.jpg'))
120 |         write_xml(os.path.join(Out_Annotations_path, str(index) + '.xml'), os.path.join(Out_JPEGImages_path, str(index) + '.jpg'), \
121 |                     headstr, input_shape, box_data, unique_labels, tailstr)
122 | 


--------------------------------------------------------------------------------
/utils/random_data.py:
--------------------------------------------------------------------------------
  1 | import cv2
  2 | import numpy as np
  3 | from PIL import Image, ImageDraw
  4 | 
  5 | 
  6 | def rand(a=0, b=1):
  7 |     return np.random.rand()*(b-a) + a
  8 | 
def get_random_data(annotation_line, input_shape, jitter=.3, hue=.1, sat=0.7, val=0.4, random=True):
    """Load one annotated image, fit it to ``input_shape`` and adjust its boxes.

    Args:
        annotation_line: Whitespace-separated string. The first token is the
            image path; every further token is a comma-separated list of
            integers whose first four values are used as x1, y1, x2, y2.
            Any extra columns are carried through unchanged.
        input_shape: Target size, unpacked as (height, width).
        jitter: Half-width of the random aspect-ratio distortion range.
        hue, sat, val: Maximum relative gains for the HSV colour jitter.
        random: When False, only letterbox the image (centred, aspect ratio
            kept, gray padding). When True, also apply random scaling,
            placement, horizontal flip and colour jitter.

    Returns:
        (image_data, box): the image as an array (float32 when ``random`` is
        False, built from a uint8 array otherwise) and the boxes that remain
        after rescaling, clipping and removal of boxes not larger than one
        pixel in each dimension.
    """
    line    = annotation_line.split()
    #------------------------------#
    #   Read the image and convert it to RGB
    #------------------------------#
    image   = Image.open(line[0])
    image   = image.convert('RGB')

    #------------------------------#
    #   Source image size and target size
    #------------------------------#
    iw, ih  = image.size
    h, w    = input_shape
    #------------------------------#
    #   Parse the boxes (one row of integers per box)
    #------------------------------#
    box     = np.array([np.array(list(map(int,box.split(',')))) for box in line[1:]])

    if not random:
        # Largest scale at which the whole image still fits inside the target.
        scale = min(w/iw, h/ih)
        nw = int(iw*scale)
        nh = int(ih*scale)
        # Offsets that centre the resized image on the canvas.
        dx = (w-nw)//2
        dy = (h-nh)//2

        #---------------------------------#
        #   Pad the unused area with gray bars
        #---------------------------------#
        image       = image.resize((nw,nh), Image.BICUBIC)
        new_image   = Image.new('RGB', (w,h), (128,128,128))
        new_image.paste(image, (dx, dy))
        image_data  = np.array(new_image, np.float32)

        #---------------------------------#
        #   Adjust the ground-truth boxes
        #---------------------------------#
        if len(box)>0:
            # Shuffle the row order in place, then map the coordinates onto the canvas.
            np.random.shuffle(box)
            box[:, [0,2]] = box[:, [0,2]]*nw/iw + dx
            box[:, [1,3]] = box[:, [1,3]]*nh/ih + dy
            # Clip the boxes to the canvas.
            box[:, 0:2][box[:, 0:2]<0] = 0
            box[:, 2][box[:, 2]>w] = w
            box[:, 3][box[:, 3]>h] = h
            box_w = box[:, 2] - box[:, 0]
            box_h = box[:, 3] - box[:, 1]
            box = box[np.logical_and(box_w>1, box_h>1)] # discard invalid box

        return image_data, box

    #------------------------------------------#
    #   Rescale the image and distort its aspect ratio
    #------------------------------------------#
    new_ar = iw/ih * rand(1-jitter,1+jitter) / rand(1-jitter,1+jitter)
    scale = rand(.25, 2)
    if new_ar < 1:
        nh = int(scale*h)
        nw = int(nh*new_ar)
    else:
        nw = int(scale*w)
        nh = int(nw/new_ar)
    image = image.resize((nw,nh), Image.BICUBIC)

    #------------------------------------------#
    #   Paste at a random offset; the rest of the canvas stays gray
    #------------------------------------------#
    # The offsets are negative when the resized image is larger than the canvas.
    dx = int(rand(0, w-nw))
    dy = int(rand(0, h-nh))
    new_image = Image.new('RGB', (w,h), (128,128,128))
    new_image.paste(image, (dx, dy))
    image = new_image

    #------------------------------------------#
    #   Random horizontal flip
    #------------------------------------------#
    flip = rand()<.5
    if flip: image = image.transpose(Image.FLIP_LEFT_RIGHT)

    image_data      = np.array(image, np.uint8)
    #---------------------------------#
    #   Colour jitter: draw one random gain per
    #   HSV channel, each in [1 - limit, 1 + limit]
    #---------------------------------#
    r               = np.random.uniform(-1, 1, 3) * [hue, sat, val] + 1
    #---------------------------------#
    #   Convert the image to HSV
    #---------------------------------#
    # Note: this rebinds the hue/sat/val parameter names to the channel
    # arrays; the gains were already captured in r above.
    hue, sat, val   = cv2.split(cv2.cvtColor(image_data, cv2.COLOR_RGB2HSV))
    dtype           = image_data.dtype
    #---------------------------------#
    #   Apply the gains through lookup tables
    #---------------------------------#
    x       = np.arange(0, 256, dtype=r.dtype)
    # Hue wraps around at 180; saturation and value are clipped to [0, 255].
    lut_hue = ((x * r[0]) % 180).astype(dtype)
    lut_sat = np.clip(x * r[1], 0, 255).astype(dtype)
    lut_val = np.clip(x * r[2], 0, 255).astype(dtype)

    image_data = cv2.merge((cv2.LUT(hue, lut_hue), cv2.LUT(sat, lut_sat), cv2.LUT(val, lut_val)))
    image_data = cv2.cvtColor(image_data, cv2.COLOR_HSV2RGB)

    #---------------------------------#
    #   Adjust the ground-truth boxes
    #---------------------------------#
    if len(box)>0:
        # Shuffle the row order in place, then map the coordinates onto the canvas.
        np.random.shuffle(box)
        box[:, [0,2]] = box[:, [0,2]]*nw/iw + dx
        box[:, [1,3]] = box[:, [1,3]]*nh/ih + dy
        # Mirror the x coordinates when the image was flipped.
        if flip: box[:, [0,2]] = w - box[:, [2,0]]
        # Clip the boxes to the canvas.
        box[:, 0:2][box[:, 0:2]<0] = 0
        box[:, 2][box[:, 2]>w] = w
        box[:, 3][box[:, 3]>h] = h
        box_w = box[:, 2] - box[:, 0]
        box_h = box[:, 3] - box[:, 1]
        # Keep only boxes wider and taller than one pixel.
        box = box[np.logical_and(box_w>1, box_h>1)] 

    return image_data, box
124 | 
def merge_bboxes(bboxes, cutx, cuty):
    """Clip per-region boxes against the mosaic cut lines and flatten them.

    ``bboxes[i]`` holds the boxes of region ``i``. Regions 0-3 keep the
    following side of the cut lines ``x = cutx`` / ``y = cuty``:

        0: y <= cuty, x <= cutx      1: y >= cuty, x <= cutx
        2: y >= cuty, x >= cutx      3: y <= cuty, x >= cutx

    A box lying entirely on the discarded side is dropped; a box that
    straddles a cut line has the crossing edge moved onto that line. Boxes
    of any other region index are passed through unchanged.

    Returns:
        A flat list of ``[x1, y1, x2, y2, last_column]`` lists.
    """
    merged = []
    for region, region_boxes in enumerate(bboxes):
        clipped_region = region in (0, 1, 2, 3)
        keeps_low_y = region in (0, 3)
        keeps_low_x = region in (0, 1)

        for box in region_boxes:
            x1, y1, x2, y2 = box[0], box[1], box[2], box[3]

            if clipped_region:
                # Drop boxes that lie completely on the discarded side.
                if (y1 > cuty) if keeps_low_y else (y2 < cuty):
                    continue
                if (x1 > cutx) if keeps_low_x else (x2 < cutx):
                    continue

                # Pull the edge that crosses the horizontal cut onto it.
                if y2 >= cuty and y1 <= cuty:
                    if keeps_low_y:
                        y2 = cuty
                    else:
                        y1 = cuty

                # Pull the edge that crosses the vertical cut onto it.
                if x2 >= cutx and x1 <= cutx:
                    if keeps_low_x:
                        x2 = cutx
                    else:
                        x1 = cutx

            merged.append([x1, y1, x2, y2, box[-1]])
    return merged
170 | 
171 | def get_random_data_with_Mosaic(annotation_line, input_shape, jitter=0.3, hue=.1, sat=0.7, val=0.4):
172 |     h, w = input_shape
173 |     min_offset_x = rand(0.3, 0.7)
174 |     min_offset_y = rand(0.3, 0.7)
175 | 
176 |     image_datas = [] 
177 |     box_datas   = []
178 |     index       = 0
179 |     for line in annotation_line:
180 |         #---------------------------------#
181 |         #   每一行进行分割
182 |         #---------------------------------#
183 |         line_content = line.split()
184 |         #---------------------------------#
185 |         #   打开图片
186 |         #---------------------------------#
187 |         image = Image.open(line_content[0])
188 |         image = image.convert('RGB')
189 |         
190 |         #---------------------------------#
191 |         #   图片的大小
192 |         #---------------------------------#
193 |         iw, ih = image.size
194 |         #---------------------------------#
195 |         #   保存框的位置
196 |         #---------------------------------#
197 |         box = np.array([np.array(list(map(int,box.split(',')))) for box in line_content[1:]])
198 |         
199 |         #---------------------------------#
200 |         #   是否翻转图片
201 |         #---------------------------------#
202 |         flip = rand()<.5
203 |         if flip and len(box)>0:
204 |             image = image.transpose(Image.FLIP_LEFT_RIGHT)
205 |             box[:, [0,2]] = iw - box[:, [2,0]]
206 | 
207 |         #------------------------------------------#
208 |         #   对图像进行缩放并且进行长和宽的扭曲
209 |         #------------------------------------------#
210 |         new_ar = iw/ih * rand(1-jitter,1+jitter) / rand(1-jitter,1+jitter)
211 |         scale = rand(.4, 1)
212 |         if new_ar < 1:
213 |             nh = int(scale*h)
214 |             nw = int(nh*new_ar)
215 |         else:
216 |             nw = int(scale*w)
217 |             nh = int(nw/new_ar)
218 |         image = image.resize((nw, nh), Image.BICUBIC)
219 | 
220 |         #-----------------------------------------------#
221 |         #   将图片进行放置，分别对应四张分割图片的位置
222 |         #-----------------------------------------------#
223 |         if index == 0:
224 |             dx = int(w*min_offset_x) - nw
225 |             dy = int(h*min_offset_y) - nh
226 |         elif index == 1:
227 |             dx = int(w*min_offset_x) - nw
228 |             dy = int(h*min_offset_y)
229 |         elif index == 2:
230 |             dx = int(w*min_offset_x)
231 |             dy = int(h*min_offset_y)
232 |         elif index == 3:
233 |             dx = int(w*min_offset_x)
234 |             dy = int(h*min_offset_y) - nh
235 |         
236 |         new_image = Image.new('RGB', (w,h), (128,128,128))
237 |         new_image.paste(image, (dx, dy))
238 |         image_data = np.array(new_image)
239 | 
240 |         index = index + 1
241 |         box_data = []
242 |         #---------------------------------#
243 |         #   对box进行重新处理
244 |         #---------------------------------#
245 |         if len(box)>0:
246 |             np.random.shuffle(box)
247 |             box[:, [0,2]] = box[:, [0,2]]*nw/iw + dx
248 |             box[:, [1,3]] = box[:, [1,3]]*nh/ih + dy
249 |             box[:, 0:2][box[:, 0:2]<0] = 0
250 |             box[:, 2][box[:, 2]>w] = w
251 |             box[:, 3][box[:, 3]>h] = h
252 |             box_w = box[:, 2] - box[:, 0]
253 |             box_h = box[:, 3] - box[:, 1]
254 |             box = box[np.logical_and(box_w>1, box_h>1)]
255 |             box_data = np.zeros((len(box),5))
256 |             box_data[:len(box)] = box
257 |         
258 |         image_datas.append(image_data)
259 |         box_datas.append(box_data)
260 | 
261 |     #---------------------------------#
262 |     #   将图片分割，放在一起
263 |     #---------------------------------#
264 |     cutx = int(w * min_offset_x)
265 |     cuty = int(h * min_offset_y)
266 | 
267 |     new_image = np.zeros([h, w, 3])
268 |     new_image[:cuty, :cutx, :] = image_datas[0][:cuty, :cutx, :]
269 |     new_image[cuty:, :cutx, :] = image_datas[1][cuty:, :cutx, :]
270 |     new_image[cuty:, cutx:, :] = image_datas[2][cuty:, cutx:, :]
271 |     new_image[:cuty, cutx:, :] = image_datas[3][:cuty, cutx:, :]
272 | 
273 |     new_image       = np.array(new_image, np.uint8)
274 |     #---------------------------------#
275 |     #   对图像进行色域变换
276 |     #   计算色域变换的参数
277 |     #---------------------------------#
278 |     r               = np.random.uniform(-1, 1, 3) * [hue, sat, val] + 1
279 |     #---------------------------------#
280 |     #   将图像转到HSV上
281 |     #---------------------------------#
282 |     hue, sat, val   = cv2.split(cv2.cvtColor(new_image, cv2.COLOR_RGB2HSV))
283 |     dtype           = new_image.dtype
284 |     #---------------------------------#
285 |     #   应用变换
286 |     #---------------------------------#
287 |     x       = np.arange(0, 256, dtype=r.dtype)
288 |     lut_hue = ((x * r[0]) % 180).astype(dtype)
289 |     lut_sat = np.clip(x * r[1], 0, 255).astype(dtype)
290 |     lut_val = np.clip(x * r[2], 0, 255).astype(dtype)
291 | 
292 |     new_image = cv2.merge((cv2.LUT(hue, lut_hue), cv2.LUT(sat, lut_sat), cv2.LUT(val, lut_val)))
293 |     new_image = cv2.cvtColor(new_image, cv2.COLOR_HSV2RGB)
294 | 
295 |     #---------------------------------#
296 |     #   对框进行进一步的处理
297 |     #---------------------------------#
298 |     new_boxes = merge_bboxes(box_datas, cutx, cuty)
299 | 
300 |     return new_image, new_boxes
301 | 
def get_random_data_with_MixUp(image_1, box_1, image_2, box_2):
    """Blend two images with equal weight and pool their bounding boxes.

    Both images are converted to float32 arrays and averaged element-wise
    (0.5 * image_1 + 0.5 * image_2), so they must have shapes that NumPy can
    combine in a single arithmetic expression.

    Args:
        image_1: First image; anything ``np.array`` can convert.
        box_1: Boxes belonging to ``image_1``; may be empty.
        image_2: Second image; anything ``np.array`` can convert.
        box_2: Boxes belonging to ``image_2``; may be empty.

    Returns:
        A ``(new_image, new_boxes)`` tuple. ``new_image`` is the float32
        blend. ``new_boxes`` is ``box_2`` itself when ``box_1`` is empty,
        ``box_1`` itself when only ``box_2`` is empty, and otherwise the two
        box sets concatenated along axis 0.
    """
    first_pixels = np.array(image_1, np.float32)
    second_pixels = np.array(image_2, np.float32)
    blended = first_pixels * 0.5 + second_pixels * 0.5

    # An empty side contributes nothing, so hand back the other side as-is
    # (no copy) instead of concatenating with an empty container.
    if len(box_1) == 0:
        return blended, box_2
    if len(box_2) == 0:
        return blended, box_1

    return blended, np.concatenate([box_1, box_2], axis=0)
311 | 


--------------------------------------------------------------------------------