# training_framework_openpose.py

from training_framework import TrainingProcess, EvaluationProcess
from tqdm import tqdm
from utils.utils_torch import transform_torch_vars, transform_torch_targets
import os
import cv2
from parse_poses import *
from utils.utils_image import draw_poses_for_coco, draw_hand_pose
import torch
from legacy_pose_extractor import extract_hand_pose

class TrainingProcessOpenPose(TrainingProcess):
    """
    Training loop for a model that outputs a (paf, heatmap) pair.

    Relies on attributes that this class reads but does not define
    (presumably provided by ``TrainingProcess`` -- verify against the base
    class): ``model``, ``optimizer``, ``loss_func``, ``scheduler``, ``lr``,
    ``writer``, ``training_data``, ``validate_data``, ``num_epoch``,
    ``is_cuda``, ``is_apex``, ``best_current_loss``, ``checkpoint_path`` and
    ``_show_init_data()``.
    """

    def __init__(self, *args,
                 is_triplet=False,
                 **kwargs):
        """
        Forward every argument to ``TrainingProcess`` and initialise the
        state owned by this subclass.

        :param args: positional arguments passed unchanged to the base class.
        :param is_triplet: flag stored on the instance; it is not read
            anywhere else in this class.
        :param kwargs: keyword arguments passed unchanged to the base class.
        """
        super().__init__(*args, **kwargs)
        self.is_triplet = is_triplet
        # Number of scheduler updates performed so far (see _train_per_batch).
        self.global_step_lr = 0
        # Learning rate most recently written into the optimizer; stays 0
        # when no scheduler is configured.
        self.lr_this_step = 0
        # Path of the checkpoint written by the previous improvement, if any.
        self.last_model_path = None

    @staticmethod
    def _smooth(previous, current):
        """Blend ``current`` 50/50 into ``previous``; the first value seeds the average."""
        if previous is None:
            return current
        return 0.5 * previous + 0.5 * current

    def _show_log(self, train_info, pbar, global_step=None):
        """
        Write the current losses and learning rate to the summary writer and
        to the progress bar.

        :param train_info: sequence ``[loss_sum, loss_paf, loss_heatmap]``.
        :param pbar: tqdm progress bar whose postfix is updated.
        :param global_step: optional step index forwarded to ``add_scalars``
            so consecutive points are not all recorded without a step.
        :return: None
        """
        self.writer.add_scalars("loss", {
            "Loss/train_sum": train_info[0],
            "Loss/train_paf": train_info[1],
            "Loss/train_heatmap": train_info[2],
            "Loss/lr": self.lr_this_step
        }, global_step=global_step)
        pbar.set_postfix(loss='%.4f' % train_info[0],
                         loss_paf='%.4f' % train_info[1],
                         loss_heatmap='%.4f' % train_info[2],
                         lr="%.6f" % self.lr_this_step)

    def train(self):
        """
        Run the full training loop.

        For each of ``self.num_epoch`` epochs: train on every batch of
        ``self.training_data``, log exponentially smoothed losses after each
        batch, then validate and keep the checkpoint if it is the best so far.

        :return: None
        """
        # Running averages; None until the first batch has been seen.
        smooth_loss_sum = None
        smooth_loss_paf = None
        smooth_loss_heatmap = None
        # Monotonic batch counter used as the logging step.
        log_step = 0
        self._show_init_data()
        self.model.train()
        ###### training ######
        for epoch_index in range(self.num_epoch):
            pbar = tqdm(enumerate(self.training_data), total=len(self.training_data), ncols=-1)
            for batch_id, data in pbar:
                loss_sum, loss_paf, loss_heatmap = self._train_per_batch(data)

                smooth_loss_sum = self._smooth(smooth_loss_sum, loss_sum)
                smooth_loss_paf = self._smooth(smooth_loss_paf, loss_paf)
                smooth_loss_heatmap = self._smooth(smooth_loss_heatmap, loss_heatmap)

                self._show_log([smooth_loss_sum, smooth_loss_paf, smooth_loss_heatmap],
                               pbar, global_step=log_step)
                log_step += 1

            # Validate after every epoch and keep the best checkpoint.
            val_loss = self._validate()
            self._save_model(val_loss, epoch_index)

    def _train_per_batch(self, data):
        """
        Run one optimisation step on a single batch.

        :param data: triple ``(resized_img, paf_t, heatmap_t)`` as yielded by
            the training data loader.
        :return: tuple ``(loss_sum, loss_paf, loss_heatmap)`` of Python floats.
        """
        resized_img, paf_t, heatmap_t = data
        # transform data #
        resized_img = transform_torch_vars(resized_img, self.is_cuda)
        paf_t = transform_torch_targets(paf_t, self.is_cuda)
        heatmap_t = transform_torch_targets(heatmap_t, self.is_cuda)
        self.optimizer.zero_grad()

        paf, heatmap = self.model(resized_img)
        loss_sum, loss_paf, loss_heatmap = self.loss_func(paf, heatmap, paf_t, heatmap_t)

        # NOTE(review): the apex branch used to be a bare ``pass`` (its
        # ``apex.amp.scale_loss`` code was commented out), so with
        # ``is_apex`` set no gradients were computed before
        # ``optimizer.step()``. Until loss scaling is wired back in, always
        # run a plain backward pass so training actually happens.
        loss_sum.backward()
        self.optimizer.step()

        # update lr
        if self.scheduler is not None:
            self.lr_this_step = self.lr * self.scheduler.get_lr(self.global_step_lr, 0.03)
            for param_group in self.optimizer.param_groups:
                param_group['lr'] = self.lr_this_step
            self.global_step_lr += 1

        # float() accepts both plain numbers and single-element tensors, so
        # the running averages kept by the caller never hold on to tensors.
        return loss_sum.item(), float(loss_paf), float(loss_heatmap)

    def _validate(self):
        """
        Evaluate the model on ``self.validate_data`` without gradients.

        The model is put back into training mode afterwards, even when
        validation raises.

        :return: summed total loss divided by ``len(self.validate_data)``.
        :raises ZeroDivisionError: if ``len(self.validate_data)`` is 0.
        """
        self.model.eval()
        loss_val = 0
        try:
            with torch.no_grad():
                for data in tqdm(self.validate_data):
                    resized_img, paf_t, heatmap_t = data
                    resized_img = transform_torch_vars(resized_img, self.is_cuda)
                    paf_t = transform_torch_targets(paf_t, self.is_cuda)
                    heatmap_t = transform_torch_targets(heatmap_t, self.is_cuda)

                    paf, heatmap = self.model(resized_img)

                    loss_sum, _, _ = self.loss_func(paf, heatmap, paf_t, heatmap_t)
                    loss_val += loss_sum.item()
        finally:
            self.model.train()

        return loss_val / len(self.validate_data)

    def _save_model(self, val_loss, epoch_index):
        """
        Save the model weights when ``val_loss`` beats the best loss so far.

        The new checkpoint is written to ``self.checkpoint_path`` (used as a
        plain string prefix) followed by ``epoch_<n>_loss_<loss>.pth``; the
        checkpoint written by the previous improvement is then deleted.

        :param val_loss: validation loss of the epoch that just finished.
        :param epoch_index: zero-based index of that epoch.
        :return: None
        """
        print("epoch=%d; val_loss=%.4f" % (epoch_index, val_loss))
        # Written as ``not (best > val)`` so a NaN loss never counts as an
        # improvement, exactly like the plain ``best > val`` test.
        if not self.best_current_loss > val_loss:
            return

        self.best_current_loss = val_loss
        current_path = self.checkpoint_path + "epoch_%d_loss_%.4f.pth" % (epoch_index, val_loss)
        print("save the best _model \t new best loss \t %.5f to file %s" % (self.best_current_loss, current_path))
        torch.save(self.model.state_dict(), current_path)

        # Keep only the newest best checkpoint on disk.
        if self.last_model_path is not None and self.last_model_path != current_path:
            try:
                os.remove(self.last_model_path)
            except FileNotFoundError:
                # Already removed by someone else; nothing left to clean up.
                pass
        self.last_model_path = current_path

class EvaluationOpenPose(EvaluationProcess):
    """
    Runs a (paf, heatmap) model over ``self.test_data`` and writes annotated
    images to ``./_image/``.

    Reads ``self.model``, ``self.test_data`` and ``self.is_cuda``, which are
    not defined in this class (presumably set by ``EvaluationProcess`` --
    verify against the base class).
    """

    @staticmethod
    def _ensure_image_dir():
        """Create ``./_image`` if needed; ``cv2.imwrite`` does not report a missing directory by raising."""
        os.makedirs("./_image", exist_ok=True)

    def _stamp_and_save(self, img, start_tick, file_path):
        """Draw the time elapsed since ``start_tick`` onto ``img`` and write it to ``file_path``."""
        elapsed = (cv2.getTickCount() - start_tick) / cv2.getTickFrequency()
        cv2.putText(img, 'parsing time: {}'.format(elapsed),
                    (10, 20), cv2.FONT_HERSHEY_COMPLEX, 1, (0, 0, 255))
        self._ensure_image_dir()
        cv2.imwrite(file_path, img)

    def test(self, num_show = 100):
        """
        Run inference on the test data, save one annotated image per batch
        and print the batch count followed by the mean seconds per batch.

        Only element 0 of each batch is parsed and drawn.

        :param num_show: cutoff for the number of batches; the loop stops
            once more than ``num_show`` batches have been processed, i.e.
            after ``num_show + 1`` batches.
        :return: None
        """
        self.model.eval()
        processed = 0
        total_seconds = 0.0
        with torch.no_grad():
            for data in tqdm(self.test_data):
                start_tick = cv2.getTickCount()
                resized_img, origin_image = data
                resized_img = transform_torch_vars(resized_img, self.is_cuda)
                origin_image = origin_image[0].numpy()
                paf, heatmap = self.model(resized_img)
                paf = paf.detach().cpu().numpy()[0]
                heatmap = heatmap.detach().cpu().numpy()[0]

                # view paf and heatmap here
                # self.view_paf_heatmap(paf, heatmap, processed)
                # parse paf and heatmap here
                self.parser_output((paf, heatmap), origin_image, processed)
                # self.parser_hand_output(heatmap, origin_image, processed)
                total_seconds += (cv2.getTickCount() - start_tick) / cv2.getTickFrequency()
                processed += 1
                if processed > num_show:
                    break

        # Report timing even when the data ran out before the cutoff; skip
        # it when nothing was processed to avoid dividing by zero.
        if processed:
            print(processed)
            print(total_seconds / processed)

    def view_paf_heatmap(self, paf_batch, heatmap_batch, ind):
        """
        Dump every slice along the first axis of both arrays as a JPEG.

        :param paf_batch: array of PAF maps; scaled by 255 before writing.
        :param heatmap_batch: array of heatmaps; scaled by 255 before writing.
        :param ind: index used in the output file names.
        :return: None
        """
        self._ensure_image_dir()
        scaled_heatmaps = heatmap_batch * 255
        scaled_pafs = paf_batch * 255
        for i, heatmap in enumerate(scaled_heatmaps):
            cv2.imwrite("./_image/heatmap_%d_%d.jpg" % (ind, i), heatmap)

        for i, paf in enumerate(scaled_pafs):
            cv2.imwrite("./_image/paf_%d_%d.jpg" % (ind, i), paf)

    def parser_output(self, pred, img, ind):
        """
        Parse body poses from the network output, draw them on ``img``
        (modified in place) and save the result.

        :param pred: ``(paf, heatmap)`` pair handed to ``parse_poses``.
        :param img: image to draw on.
        :param ind: index used in the output file name.
        :return: None
        """
        start_tick = cv2.getTickCount()
        # NOTE(review): meaning of 0.125 is defined by parse_poses -- confirm.
        poses_2d = parse_poses(pred, 0.125)

        draw_poses_for_coco(img, poses_2d, is_filter=False)
        self._stamp_and_save(img, start_tick, "./_image/img_coco_with_pose_%d.jpg" % ind)

    def parser_hand_output(self, pred_heat, img, ind):
        """
        Extract a hand pose from the heatmaps, draw it on ``img`` (modified
        in place) and save the result.

        :param pred_heat: heatmap array; the last entry along the first axis
            is dropped before extraction (presumably a background channel --
            TODO confirm).
        :param img: image to draw on.
        :param ind: index used in the output file name.
        :return: None
        """
        start_tick = cv2.getTickCount()
        poses_2d = extract_hand_pose(pred_heat[0:-1], 0.125)

        draw_hand_pose(img, poses_2d)
        self._stamp_and_save(img, start_tick, "./_image/img_with_pose_%d.jpg" % ind)