update readme and mixup

bubbliiiing · bubbliiiing · commit 2c6d8947031e · 2022-06-01T11:09:01.000+08:00
diff --git a/README.md b/README.md
@@ -23,12 +23,13 @@ BiliBili视频中的原仓库地址为：https://github.com/bubbliiiing/yolov4-t
 ## 相关仓库
 | 模型 | 路径 |
 | :----- | :----- |
-YoloV3 | https://github.com/bubbliiiing/yolo3-keras  
-Efficientnet-Yolo3 | https://github.com/bubbliiiing/efficientnet-yolo3-keras  
+YoloV3 | https://github.com/bubbliiiing/yolo3-keras  
+Efficientnet-Yolo3 | https://github.com/bubbliiiing/efficientnet-yolo3-keras  
 YoloV4 | https://github.com/bubbliiiing/yolov4-keras
 YoloV4-tiny | https://github.com/bubbliiiing/yolov4-tiny-keras
 Mobilenet-Yolov4 | https://github.com/bubbliiiing/mobilenet-yolov4-keras
-YoloV5 | https://github.com/bubbliiiing/yolov5-keras
+YoloV5-V5.0 | https://github.com/bubbliiiing/yolov5-keras
+YoloV5-V6.1 | https://github.com/bubbliiiing/yolov5-v6.1-keras
 YoloX | https://github.com/bubbliiiing/yolox-keras
 
 ## 性能情况
diff --git a/train.py b/train.py
@@ -91,18 +91,29 @@
     #   phi = 4为CA
     #-------------------------------#
     phi             = 0
-    #------------------------------------------------------#
-    #   Yolov4的tricks应用
-    #   mosaic          马赛克数据增强
-    #                   参考YoloX，由于Mosaic生成的训练图片，
-    #                   远远脱离自然图片的真实分布。
-    #                   本代码会在训练结束前的N个epoch自动关掉Mosaic
-    #                   100个世代会关闭30个世代（比例可在dataloader.py调整）
-    #   label_smoothing 标签平滑。一般0.01以下。如0.01、0.005
+    #------------------------------------------------------------------#
+    #   mosaic              马赛克数据增强。
+    #   mosaic_prob         每个step有多少概率使用mosaic数据增强，默认50%。
+    #
+    #   mixup               是否使用mixup数据增强，仅在mosaic=True时有效。
+    #                       只会对mosaic增强后的图片进行mixup的处理。
+    #   mixup_prob          有多少概率在mosaic后使用mixup数据增强，默认50%。
+    #                       总的mixup概率为mosaic_prob * mixup_prob。
+    #
+    #   special_aug_ratio   参考YoloX，由于Mosaic生成的训练图片，远远脱离自然图片的真实分布。
+    #                       当mosaic=True时，本代码会在special_aug_ratio范围内开启mosaic。
+    #                       默认为前70%个epoch，100个世代会开启70个世代。
     #
     #   余弦退火算法的参数放到下面的lr_decay_type中设置
-    #------------------------------------------------------#
-    mosaic              = False
+    #------------------------------------------------------------------#
+    mosaic              = True
+    mosaic_prob         = 0.5
+    mixup               = True
+    mixup_prob          = 0.5
+    special_aug_ratio   = 0.7
+    #------------------------------------------------------------------#
+    #   label_smoothing     标签平滑。一般0.01以下。如0.01、0.005。
+    #------------------------------------------------------------------#
     label_smoothing     = 0
 
     #----------------------------------------------------------------------------------------------------------------------------#
@@ -343,8 +354,10 @@
         if epoch_step == 0 or epoch_step_val == 0:
             raise ValueError('数据集过小，无法进行训练，请扩充数据集。')
 
-        train_dataloader    = YoloDatasets(train_lines, input_shape, anchors, batch_size, num_classes, anchors_mask, Init_Epoch, UnFreeze_Epoch, mosaic = mosaic, train = True)
-        val_dataloader      = YoloDatasets(val_lines, input_shape, anchors, batch_size, num_classes, anchors_mask, Init_Epoch, UnFreeze_Epoch, mosaic = False, train = False)
+        train_dataloader    = YoloDatasets(train_lines, input_shape, anchors, batch_size, num_classes, anchors_mask, Init_Epoch, UnFreeze_Epoch, \
+                                            mosaic=mosaic, mixup=mixup, mosaic_prob=mosaic_prob, mixup_prob=mixup_prob, train=True, special_aug_ratio=special_aug_ratio)
+        val_dataloader      = YoloDatasets(val_lines, input_shape, anchors, batch_size, num_classes, anchors_mask, Init_Epoch, UnFreeze_Epoch, \
+                                            mosaic=False, mixup=False, mosaic_prob=0, mixup_prob=0, train=False, special_aug_ratio=0)
 
         #-------------------------------------------------------------------------------#
         #   训练参数的设置
diff --git a/utils/dataloader.py b/utils/dataloader.py
@@ -9,7 +9,8 @@
 
 
 class YoloDatasets(keras.utils.Sequence):
-    def __init__(self, annotation_lines, input_shape, anchors, batch_size, num_classes, anchors_mask, epoch_now, epoch_length, mosaic, train, mosaic_ratio = 0.7):
+    def __init__(self, annotation_lines, input_shape, anchors, batch_size, num_classes, anchors_mask, epoch_now, epoch_length, \
+                        mosaic, mixup, mosaic_prob, mixup_prob, train, special_aug_ratio = 0.7):
         self.annotation_lines   = annotation_lines
         self.length             = len(self.annotation_lines)
         
@@ -21,10 +22,11 @@ def __init__(self, annotation_lines, input_shape, anchors, batch_size, num_class
         self.epoch_now          = epoch_now - 1
         self.epoch_length       = epoch_length
         self.mosaic             = mosaic
+        self.mosaic_prob        = mosaic_prob
+        self.mixup              = mixup
+        self.mixup_prob         = mixup_prob
         self.train              = train
-        self.mosaic_ratio       = mosaic_ratio
-
-        self.threshold          = 4
+        self.special_aug_ratio  = special_aug_ratio
 
     def __len__(self):
         return math.ceil(len(self.annotation_lines) / float(self.batch_size))
@@ -38,14 +40,16 @@ def __getitem__(self, index):
             #   训练时进行数据的随机增强
             #   验证时不进行数据的随机增强
             #---------------------------------------------------#
-            if self.mosaic:
-                if self.rand() < 0.5 and self.epoch_now < self.epoch_length * self.mosaic_ratio:
-                    lines = sample(self.annotation_lines, 3)
-                    lines.append(self.annotation_lines[i])
-                    shuffle(lines)
-                    image, box = self.get_random_data_with_Mosaic(lines, self.input_shape)
-                else:
-                    image, box = self.get_random_data(self.annotation_lines[i], self.input_shape, random = self.train)
+            if self.mosaic and self.rand() < self.mosaic_prob and self.epoch_now < self.epoch_length * self.special_aug_ratio:
+                lines = sample(self.annotation_lines, 3)
+                lines.append(self.annotation_lines[i])
+                shuffle(lines)
+                image, box = self.get_random_data_with_Mosaic(lines, self.input_shape)
+                    
+                if self.mixup and self.rand() < self.mixup_prob:
+                    lines           = sample(self.annotation_lines, 1)
+                    image_2, box_2  = self.get_random_data(lines[0], self.input_shape, random = self.train)
+                    image, box      = self.get_random_data_with_MixUp(image, box, image_2, box_2)
             else:
                 image, box  = self.get_random_data(self.annotation_lines[i], self.input_shape, random = self.train)
             image_data.append(preprocess_input(np.array(image, np.float32)))
@@ -368,6 +372,25 @@ def get_random_data_with_Mosaic(self, annotation_line, input_shape, max_boxes=50
             box_data[:len(new_boxes)] = new_boxes
         return new_image, box_data
 
+    def get_random_data_with_MixUp(self, image_1, box_1, image_2, box_2, max_boxes=500):
+        new_image = np.array(image_1, np.float32) * 0.5 + np.array(image_2, np.float32) * 0.5
+        
+        box_1_wh    = box_1[:, 2:4] - box_1[:, 0:2]
+        box_1_valid = box_1_wh[:, 0] > 0
+        
+        box_2_wh    = box_2[:, 2:4] - box_2[:, 0:2]
+        box_2_valid = box_2_wh[:, 0] > 0
+        
+        new_boxes = np.concatenate([box_1[box_1_valid, :], box_2[box_2_valid, :]], axis=0)
+        #---------------------------------#
+        #   将box进行调整
+        #---------------------------------#
+        box_data = np.zeros((max_boxes, 5))
+        if len(new_boxes)>0:
+            if len(new_boxes)>max_boxes: new_boxes = new_boxes[:max_boxes]
+            box_data[:len(new_boxes)] = new_boxes
+        return new_image, box_data
+
     def preprocess_true_boxes(self, true_boxes, input_shape, anchors, num_classes):
         assert (true_boxes[..., 4]<num_classes).all(), 'class id must be less than num_classes'
         #-----------------------------------------------------------#