# Deep-learning based automatic lung-nodule detection in CT images, part 4:
# data augmentation, network definition and training.
# Originally published: 2019-01-05
# -*- coding: utf-8 -*-
# Train the image-segmentation (U-Net) model.
import csv
import glob
import os
import random
from typing import List, Tuple

import cv2
import numpy
# BUGFIX: this import was split across two lines without a continuation,
# which is a syntax error; wrap it in parentheses instead.
from keras.layers import (Input, Convolution2D, MaxPooling2D, UpSampling2D,
                          merge, BatchNormalization, SpatialDropout2D)
from keras.models import Model
from keras.optimizers import SGD
from keras import backend as K
from keras.callbacks import ModelCheckpoint, Callback
from scipy.ndimage.interpolation import map_coordinates
from scipy.ndimage.filters import gaussian_filter  # Gaussian smoothing kernel

# Number of consecutive CT frames per training sample.
MEAN_FRAME_COUNT = 1
# Input channels (grayscale).
CHANNEL_COUNT = 1
# Side length (pixels) of the square images fed to the segmenter.
SEGMENTER_IMG_SIZE = 320
MODEL_DIR = './model/'
BATCH_SIZE = 8
# CSV lists of training / validation image paths — must be filled in before training.
TRAIN_LIST = ''
VAL_LIST = ''
TRAIN_TEMP_DIR = './temp_dir/chapter4/'
# ===== Data augmentation =====
# Randomly scale an image for data augmentation.
def random_scale_img(img, xy_range, lock_xy=False):
    """Scale by random factors drawn from xy_range, then pad/crop back to the
    original size.  Returns a list of images (input may be a single image or
    a list of same-sized images).

    xy_range -- XYRange with the per-axis scale ranges and the trigger chance
    lock_xy  -- if True, use the same factor for both axes
    """
    if random.random() > xy_range.chance:
        return img
    if not isinstance(img, list):
        img = [img]
    import cv2
    scale_x = random.uniform(xy_range.x_min, xy_range.x_max)
    scale_y = random.uniform(xy_range.y_min, xy_range.y_max)
    if lock_xy:
        scale_y = scale_x
    org_height, org_width = img[0].shape[:2]
    xy_range.last_x = scale_x
    xy_range.last_y = scale_y
    res = []
    for img_inst in img:
        scaled_width = int(org_width * scale_x)
        scaled_height = int(org_height * scale_y)
        scaled_img = cv2.resize(img_inst, (scaled_width, scaled_height), interpolation=cv2.INTER_CUBIC)
        if scaled_width < org_width:
            # Pad symmetrically back to the original width.
            # BUGFIX: integer division — cv2.copyMakeBorder requires ints
            # (plain / yields float in Python 3).
            extend_left = (org_width - scaled_width) // 2
            extend_right = org_width - extend_left - scaled_width
            scaled_img = cv2.copyMakeBorder(scaled_img, 0, 0, extend_left, extend_right, borderType=cv2.BORDER_CONSTANT)
            scaled_width = org_width
        if scaled_height < org_height:
            extend_top = (org_height - scaled_height) // 2
            extend_bottom = org_height - extend_top - scaled_height
            scaled_img = cv2.copyMakeBorder(scaled_img, extend_top, extend_bottom, 0, 0, borderType=cv2.BORDER_CONSTANT)
            scaled_height = org_height
        # Centre-crop when the scaled image is larger than the original.
        # BUGFIX: slice indices must be ints as well.
        start_x = (scaled_width - org_width) // 2
        start_y = (scaled_height - org_height) // 2
        tmp = scaled_img[start_y: start_y + org_height, start_x: start_x + org_width]
        res.append(tmp)
    return res
class XYRange:
    """Per-axis augmentation ranges plus the probability that the
    augmentation fires; also records the last values that were drawn."""

    def __init__(self, x_min, x_max, y_min, y_max, chance=1.0):
        self.chance = chance
        self.x_min = x_min
        self.x_max = x_max
        self.y_min = y_min
        self.y_max = y_max
        self.last_x = 0
        self.last_y = 0

    def get_last_xy_txt(self):
        """Compact text tag of the last drawn (x, y); minus signs become 'm'."""
        def fmt(value):
            return str(int(value * 100)).replace("-", "m")
        return "x_" + fmt(self.last_x) + "-" + "y_" + fmt(self.last_y)
# Randomly translate an image for data augmentation.
def random_translate_img(img, xy_range, border_mode="constant"):
    """Shift by a random integer offset drawn from xy_range.

    A single input image comes back as a single image; a list comes back as
    a list.  border_mode "reflect" mirrors the edge pixels, anything else
    pads with the (zero) constant border.
    """
    if random.random() > xy_range.chance:
        return img
    import cv2
    if not isinstance(img, list):
        img = [img]
    height, width = img[0].shape[:2]
    shift_x = random.randint(xy_range.x_min, xy_range.x_max)
    shift_y = random.randint(xy_range.y_min, xy_range.y_max)
    trans_matrix = numpy.float32([[1, 0, shift_x], [0, 1, shift_y]])
    border = cv2.BORDER_REFLECT if border_mode == "reflect" else cv2.BORDER_CONSTANT
    res = [cv2.warpAffine(item, trans_matrix, (width, height), borderMode=border)
           for item in img]
    if len(res) == 1:
        res = res[0]
    xy_range.last_x = shift_x
    xy_range.last_y = shift_y
    return res
# Randomly rotate an image for data augmentation.
def random_rotate_img(img, chance, min_angle, max_angle):
    """Rotate around the image centre by a random angle in
    [min_angle, max_angle] degrees, with probability `chance`.
    A single input image comes back as a single image; a list as a list.
    """
    import cv2
    if random.random() > chance:
        return img
    if not isinstance(img, list):
        img = [img]
    angle = random.randint(min_angle, max_angle)
    height, width = img[0].shape[:2]
    # BUGFIX: OpenCV expects (x, y) = (col, row); the original swapped
    # rows/cols for both the centre and dsize (only harmless for squares).
    center = (width / 2, height / 2)
    rot_matrix = cv2.getRotationMatrix2D(center, angle, scale=1.0)
    res = []
    for img_inst in img:
        img_inst = cv2.warpAffine(img_inst, rot_matrix, dsize=(width, height), borderMode=cv2.BORDER_CONSTANT)
        res.append(img_inst)
    # BUGFIX: was `len(res) == 0` — a dead branch (res is never empty here).
    # Unwrap single images, matching random_translate_img's convention.
    if len(res) == 1:
        res = res[0]
    return res
# Randomly flip an image for data augmentation.
def random_flip_img(img, horizontal_chance=0, vertical_chance=0):
    """Flip horizontally and/or vertically, each with its own probability.

    cv2.flip codes: 1 = around the Y axis (horizontal flip),
    0 = around the X axis (vertical flip), -1 = both.
    """
    import cv2
    do_horizontal = random.random() < horizontal_chance
    do_vertical = random.random() < vertical_chance
    if not do_horizontal and not do_vertical:
        return img
    if do_vertical:
        flip_val = -1 if do_horizontal else 0
    else:
        flip_val = 1
    if isinstance(img, list):
        return [cv2.flip(item, flip_val) for item in img]
    return cv2.flip(img, flip_val)
# Cached displacement field shared across calls, so an image and its mask
# receive exactly the same elastic deformation.  Reset to None (as
# image_generator does once per epoch) to draw a new field.
ELASTIC_INDICES = None

# Elastic deformation of an image, for data augmentation.
def elastic_transform(image, alpha, sigma, random_state=None):
    """Apply a smoothed random displacement field to `image`.

    alpha scales the displacement strength; sigma is the Gaussian smoothing
    width.  The field is computed on first use and cached in ELASTIC_INDICES.
    """
    global ELASTIC_INDICES
    shape = image.shape
    # BUGFIX: compare with `is None` — once set, the cached value is a tuple
    # of arrays, which must not be compared to None with `==`.
    if ELASTIC_INDICES is None:
        if random_state is None:
            random_state = numpy.random.RandomState(1301)
        dx = gaussian_filter((random_state.rand(*shape) * 2 - 1), sigma, mode="constant", cval=0) * alpha
        dy = gaussian_filter((random_state.rand(*shape) * 2 - 1), sigma, mode="constant", cval=0) * alpha
        x, y = numpy.meshgrid(numpy.arange(shape[0]), numpy.arange(shape[1]))
        ELASTIC_INDICES = numpy.reshape(y + dy, (-1, 1)), numpy.reshape(x + dx, (-1, 1))
    return map_coordinates(image, ELASTIC_INDICES, order=1).reshape(shape)
# ===== Pre-test image preparation: dtype conversion and channel normalisation (grayscale) =====
# Convert image dtype and normalise grey levels (grayscale).
def prepare_image_for_net(img):
    """Scale pixel values to [0, 1] and reshape to the 4-D
    (batch, height, width, channels) layout the network expects."""
    # BUGFIX: numpy.float was removed in NumPy 1.24; float64 is the same type.
    img = img.astype(numpy.float64)
    img /= 255.
    if len(img.shape) == 3:
        # BUGFIX: the original reshaped a 3-D image to its own shape (a
        # no-op); add the leading batch dimension instead so both branches
        # return a 4-D array.
        img = img.reshape(1, img.shape[-3], img.shape[-2], img.shape[-1])
    else:
        img = img.reshape(1, img.shape[-2], img.shape[-1], 1)
    return img
# Build the (image, mask) path pairs for the training and holdout sets.
def get_train_holdout_files():
    """Read the TRAIN_LIST / VAL_LIST CSV files and pair each image path
    with its mask path (same name with _img.png replaced by _mask.png).
    Each list is shuffled; empty rows are skipped."""
    def load_pairs(csv_path):
        # One sample path per CSV row; shuffle for random ordering.
        with open(csv_path, 'r') as f:
            samples = list(csv.reader(f))
        random.shuffle(samples)
        pairs = []
        for row in samples:
            if len(row) == 0:
                print('space line, skip')
                continue
            pairs.append((row[0], row[0].replace("_img.png", "_mask.png")))
        return pairs

    train_res = load_pairs(TRAIN_LIST)
    holdout_res = load_pairs(VAL_LIST)
    print("Train count: ", len(train_res), ", holdout count: ", len(holdout_res))
    return train_res, holdout_res
# ===== Define and train the neural network =====
# Dice coefficient (Keras backend tensors) — overlap between predicted and true masks.
def dice_coef(y_true, y_pred, smooth=100):
    """Soft Dice in (0, 1]; `smooth` stabilises the ratio for empty masks.
    The constant 100 was hard-coded; it is now a backward-compatible parameter."""
    y_true_f = K.flatten(y_true)
    y_pred_f = K.flatten(y_pred)
    intersection = K.sum(y_true_f * y_pred_f)
    return (2. * intersection + smooth) / (K.sum(y_true_f) + K.sum(y_pred_f) + smooth)
# Dice coefficient (NumPy version) — used for offline evaluation.
def dice_coef_np(y_true, y_pred, smooth=100):
    """Soft Dice in (0, 1]; `smooth` stabilises the ratio for empty masks.
    The constant 100 was hard-coded; it is now a backward-compatible parameter."""
    y_true_f = y_true.flatten()
    y_pred_f = y_pred.flatten()
    intersection = numpy.sum(y_true_f * y_pred_f)
    return (2. * intersection + smooth) / (numpy.sum(y_true_f) + numpy.sum(y_pred_f) + smooth)
# U-Net training loss: Keras minimises, so use the negated Dice coefficient.
def dice_coef_loss(y_true, y_pred):
    """Return -dice_coef so that maximising overlap minimises the loss."""
    dice = dice_coef(y_true, y_pred)
    return -dice
# After every epoch, save input / ground-truth / prediction triplets as PNGs.
class DumpPredictions(Callback):
    def __init__(self, dump_filelist: List[Tuple[str, str]], model_type):
        """dump_filelist -- (image_path, mask_path) pairs to visualise."""
        super(DumpPredictions, self).__init__()
        self.dump_filelist = dump_filelist
        self.batch_count = 0
        if not os.path.exists(TRAIN_TEMP_DIR):
            # BUGFIX: TRAIN_TEMP_DIR is a nested path ('./temp_dir/chapter4/');
            # os.mkdir fails when the parent does not exist yet.
            os.makedirs(TRAIN_TEMP_DIR)
        # Clear out dumps from a previous run.
        for file_path in glob.glob(TRAIN_TEMP_DIR + "*.*"):
            os.remove(file_path)
        self.model_type = model_type

    def on_epoch_end(self, epoch, logs=None):
        model = self.model  # type: Model
        generator = image_generator(self.dump_filelist, 1, train_set=False)
        # Dump the first 10 validation samples of this epoch.
        for i in range(0, 10):
            x, y = next(generator)
            y_pred = model.predict(x, batch_size=1)
            # (1, h, w, 1) -> take the single channel plane.
            x = x.swapaxes(0, 3)
            x = x[0]
            x *= 255.
            # BUGFIX: was (x.shape[0], x.shape[0]) — only correct for square
            # images; use height x width.
            x = x.reshape((x.shape[0], x.shape[1])).astype(numpy.uint8)
            y *= 255.
            y = y.reshape((y.shape[1], y.shape[2])).astype(numpy.uint8)
            y_pred *= 255.
            y_pred = y_pred.reshape((y_pred.shape[1], y_pred.shape[2])).astype(numpy.uint8)
            cv2.imwrite(TRAIN_TEMP_DIR + "img_{0:03d}_{1:02d}_i.png".format(epoch, i), x)
            cv2.imwrite(TRAIN_TEMP_DIR + "img_{0:03d}_{1:02d}_o.png".format(epoch, i), y)
            cv2.imwrite(TRAIN_TEMP_DIR + "img_{0:03d}_{1:02d}_p.png".format(epoch, i), y_pred)
# Infinite batch generator for training / validation.
def image_generator(batch_files, batch_size, train_set):
    """Yield (x, y) batches of shape (batch, h, w, 1) forever.

    batch_files -- list of (image_path, mask_path) pairs
    train_set   -- when True, shuffle every epoch and apply augmentation
    """
    global ELASTIC_INDICES
    while True:
        if train_set:
            random.shuffle(batch_files)
        batch_imgs = []
        batch_masks = []
        # Draw a fresh elastic displacement field for every pass over the data.
        ELASTIC_INDICES = None
        for file_pair in batch_files:
            images = [cv2.imread(file_pair[0], cv2.IMREAD_GRAYSCALE)]
            overlay = cv2.imread(file_pair[1], cv2.IMREAD_GRAYSCALE)
            if train_set:
                # ~50%: elastic-deform image and mask with the same field so
                # they stay aligned.
                if random.randint(0, 100) > 50:
                    images = [elastic_transform(item, 128, 15) for item in images]
                    overlay = elastic_transform(overlay, 128, 15)
                # Rotate / flip / translate image and mask together by
                # augmenting them as one list.
                augmented = images + [overlay]
                augmented = random_rotate_img(augmented, 0.8, -20, 20)
                augmented = random_flip_img(augmented, 0.5, 0.5)
                augmented = random_translate_img(augmented, XYRange(-30, 30, -30, 30, 0.8))
                images = augmented[:-1]
                overlay = augmented[-1]
            images = [prepare_image_for_net(item) for item in images]
            overlay = prepare_image_for_net(overlay)
            images3d = numpy.vstack(images).swapaxes(0, 3)
            batch_imgs.append(images3d)
            batch_masks.append(overlay)
            if len(batch_imgs) >= batch_size:
                yield numpy.vstack(batch_imgs), numpy.vstack(batch_masks)
                batch_imgs = []
                batch_masks = []
# 實現unet的網路結構,並載入預訓練好的權重
def get_unet(learn_rate=0.0001