基於深度學習的CT影象肺結節自動檢測技術二——訓練資料處理

阿新 • • 發佈：2019-02-12

開發環境 Anaconda:jupyter notebook/pycharm

pip install dicom            # 用於讀取 dicom 圖片(version0.9.9)
pip install SimpleITK        # 讀取CT醫學影象
pip install tqdm             # 可擴充套件的Python進度條，封裝迭代器 
pip install pydicom          # 用於讀取 dicom 圖片
pip install opencv-python

一、訓練資料處理

讀取dicom 圖片——提取畫素值（範圍約 -4000 ~ 4000）

# 準備3dcnn的訓練資料 

import os
import SimpleITK
import dicom
import numpy as np
import cv2
import glob
from tqdm import tqdm


def is_dicom_file(filename):
    """
    Tell whether a file carries the ``DICM`` marker of a DICOM file.

    The check reads the four bytes stored at byte offset 128 and compares
    them with ``b'DICM'``.

    :param filename: path of the file to inspect
    :return: True when the four bytes at offset 128 equal ``b'DICM'``,
             False otherwise (including files shorter than 132 bytes)
    """
    # The context manager closes the handle even if seek()/read() raises.
    with open(filename, 'rb') as file_stream:
        file_stream.seek(128)
        data = file_stream.read(4)
    return data == b'DICM'


def load_patient(src_dir):
    """
    Load every DICOM file found directly inside a directory.

    Regular files are recognised with ``is_dicom_file``, parsed with
    ``dicom.read_file`` and sorted by their ``InstanceNumber``. The distance
    between the first two sorted slices is then stored as ``SliceThickness``
    on every slice.

    :param src_dir: directory that holds the DICOM files of one patient
    :return: list of parsed DICOM datasets ordered by ``InstanceNumber``
    :raises IndexError: when fewer than two DICOM files are found, because
                        the slice distance cannot be computed
    """
    slices = []
    for name in os.listdir(src_dir):
        path = os.path.join(src_dir, name)
        # Sub-directories cannot be opened as files; skip them instead of crashing.
        if os.path.isfile(path) and is_dicom_file(path):
            slices.append(dicom.read_file(path))
    slices.sort(key=lambda x: int(x.InstanceNumber))

    if len(slices) < 2:
        raise IndexError(
            "need at least two DICOM slices in %r to compute the slice distance, found %d"
            % (src_dir, len(slices)))

    try:
        slice_thickness = np.abs(slices[0].ImagePositionPatient[2]
                                 - slices[1].ImagePositionPatient[2])
    except (AttributeError, IndexError, KeyError, TypeError):
        # ImagePositionPatient is missing or unusable: fall back to SliceLocation.
        slice_thickness = np.abs(slices[0].SliceLocation - slices[1].SliceLocation)

    for s in slices:
        s.SliceThickness = slice_thickness
    return slices


def get_pixels_hu_by_simpleitk(dicom_dir):
    """
    Read the DICOM series stored in a directory and return its voxel array.

    :param dicom_dir: directory that holds the DICOM series
    :return: the array produced by ``SimpleITK.GetArrayFromImage`` for the
             series, with every voxel equal to -2000 replaced by 0
    """
    series_reader = SimpleITK.ImageSeriesReader()
    series_files = series_reader.GetGDCMSeriesFileNames(dicom_dir)
    series_reader.SetFileNames(series_files)
    voxels = SimpleITK.GetArrayFromImage(series_reader.Execute())

    # presumably -2000 is the scanner's out-of-field padding value — TODO confirm
    padding_mask = voxels == -2000
    voxels[padding_mask] = 0
    return voxels

將dicom影象縮放歸一化（1mm×1mm×1mm 的尺度）

def rescale_patient_images(images_zyx, org_spacing_xyz, target_voxel_mm, is_mask_image=False):
    """
    Resample a 3-D volume so that each voxel edge measures ``target_voxel_mm``.

    The work is done with two ``cv2.resize`` passes. The first pass scales
    axis 0 (z) by ``org_spacing_xyz[2] / target_voxel_mm``. The axes are then
    swapped so that z becomes the cv2 channel axis, and the second pass scales
    x by ``org_spacing_xyz[0] / target_voxel_mm`` and y by
    ``org_spacing_xyz[1] / target_voxel_mm``. Finally the axes are swapped
    back to (z, y, x).

    :param images_zyx: 3-D image array indexed (z, y, x)
    :param org_spacing_xyz: original voxel spacing, indexed (x, y, z)
    :param target_voxel_mm: desired voxel spacing along every axis
    :param is_mask_image: when True use nearest-neighbour interpolation,
                          otherwise linear interpolation
    :return: the resampled 3-D array indexed (z, y, x)
    """

    print("Spacing: ", org_spacing_xyz)
    print("Shape: ", images_zyx.shape)

    interpolation = cv2.INTER_NEAREST if is_mask_image else cv2.INTER_LINEAR

    # Pass 1: rows are z, columns are y, channels are x -> only z is scaled.
    resize_x = 1.0
    resize_y = float(org_spacing_xyz[2]) / float(target_voxel_mm)
    res = cv2.resize(images_zyx, dsize=None, fx=resize_x, fy=resize_y, interpolation=interpolation)

    # (z, y, x) -> (y, x, z): the already-resized z axis becomes the channel axis.
    res = res.swapaxes(0, 2)
    res = res.swapaxes(0, 1)
    resize_x = float(org_spacing_xyz[0]) / float(target_voxel_mm)
    resize_y = float(org_spacing_xyz[1]) / float(target_voxel_mm)

    # cv2 can handle max 512 channels..
    max_channels = 512
    if res.shape[2] > max_channels:
        # Resize in groups of at most ``max_channels`` channels. Channels are
        # interpolated independently, so grouping does not change the result,
        # and every group stays within the limit however deep the volume is.
        channel_first = res.swapaxes(0, 2)
        resized_groups = []
        for start in range(0, channel_first.shape[0], max_channels):
            group = channel_first[start:start + max_channels].swapaxes(0, 2)
            group = cv2.resize(group, dsize=None, fx=resize_x, fy=resize_y, interpolation=interpolation)
            if group.ndim == 2:
                # cv2.resize drops the channel axis of a single-channel image.
                group = group[:, :, np.newaxis]
            resized_groups.append(group.swapaxes(0, 2))
        res = np.vstack(resized_groups)
        res = res.swapaxes(0, 2)
    else:
        res = cv2.resize(res, dsize=None, fx=resize_x, fy=resize_y, interpolation=interpolation)

    # (y, x, z) -> (z, y, x)
    res = res.swapaxes(0, 2)
    res = res.swapaxes(2, 1)

    print("Shape after: ", res.shape)
    return res

切割為小cube並平鋪儲存為png

def get_cube_from_img(img3d, center_x, center_y, center_z, block_size):
    """
    Cut a cube of edge ``block_size`` out of a 3-D volume around a centre point.

    Along every axis the cube starts at ``center - block_size / 2``. The start
    is shifted so the cube stays inside the volume; if the volume is shorter
    than ``block_size`` along an axis, the whole axis is returned.

    :param img3d: 3-D array indexed (z, y, x)
    :param center_x: centre coordinate along axis 2
    :param center_y: centre coordinate along axis 1
    :param center_z: centre coordinate along axis 0
    :param block_size: edge length of the cube in voxels
    :return: the sub-array ``img3d[z0:z0+block_size, y0:y0+block_size, x0:x0+block_size]``
    """

    def clamp_start(center, axis_len):
        # Same arithmetic for all three axes; y previously lacked the upper clamp.
        start = max(center - block_size / 2, 0)
        if start + block_size > axis_len:
            start = axis_len - block_size
        # A negative start would be read as "count from the end" by slicing.
        return int(max(start, 0))

    start_z = clamp_start(center_z, img3d.shape[0])
    start_y = clamp_start(center_y, img3d.shape[1])
    start_x = clamp_start(center_x, img3d.shape[2])
    res = img3d[start_z:start_z + block_size,
                start_y:start_y + block_size,
                start_x:start_x + block_size]
    return res

畫素值（-4000 ~ 4000）歸一化—>讀取影象：3維cube影象（儲存為2維影象方便檢視）

def normalize_hu(image):
    """
    Rescale pixel values linearly so that -1000 maps to 0 and 400 maps to 1.

    Values that fall outside that window are saturated to 0 or 1.

    :param image: input image array
    :return: a new array with every value in the range [0, 1]
    """
    lower, upper = -1000.0, 400.0
    scaled = (image - lower) / (upper - lower)
    # Saturate in place on the freshly created array; the input is untouched.
    np.clip(scaled, 0.0, 1.0, out=scaled)
    return scaled


def load_patient_images(src_dir, wildcard="*.*", exclude_wildcards=()):
    """
    Read the images of one patient as grayscale and stack them into a 3-D array.

    Patterns are appended directly to ``src_dir`` (plain string
    concatenation), so ``src_dir`` has to end with a path separator. Matching
    files are read in sorted path order.

    :param src_dir: directory prefix that the patterns are appended to
    :param wildcard: glob pattern selecting the images to load
    :param exclude_wildcards: glob patterns whose matches are left out
    :return: 3-D array with one image per index along axis 0
    :raises OSError: when ``cv2.imread`` cannot read one of the selected files
    :raises ValueError: when no file is selected (nothing to stack)
    """
    # Collect exclusions once in a set so filtering is a single linear pass.
    excluded = set()
    for exclude_wildcard in exclude_wildcards:
        excluded.update(glob.glob(src_dir + exclude_wildcard))
    src_img_paths = sorted(
        path for path in glob.glob(src_dir + wildcard) if path not in excluded)

    images = []
    for img_path in src_img_paths:
        img = cv2.imread(img_path, cv2.IMREAD_GRAYSCALE)
        if img is None:
            # cv2.imread signals failure by returning None instead of raising.
            raise OSError("could not read image: " + img_path)
        images.append(img)
    return np.stack(images)


def save_cube_img(target_path, cube_img, rows, cols):
    """
    Tile the slices of a 3-D cube into one 2-D mosaic and write it to disk.

    Slice ``row * cols + col`` of ``cube_img`` is placed at grid cell
    (row, col) of the mosaic, which is stored as 8-bit data through
    ``cv2.imwrite``.

    :param target_path: path of the image file to write
    :param cube_img: 3-D array indexed (slice, height, width)
    :param rows: number of tile rows in the mosaic
    :param cols: number of tile columns in the mosaic
    :return: None
    """

    assert rows * cols == cube_img.shape[0]
    img_height = cube_img.shape[1]
    # Width comes from the last axis, so non-square slices are tiled correctly.
    img_width = cube_img.shape[2]
    res_img = np.zeros((rows * img_height, cols * img_width), dtype=np.uint8)

    for row in range(rows):
        for col in range(cols):
            target_y = row * img_height
            target_x = col * img_width
            res_img[target_y:target_y + img_height,
                    target_x:target_x + img_width] = cube_img[row * cols + col]

    cv2.imwrite(target_path, res_img)


if __name__ == '__main__':
    dicom_dir = './data/dicom_demo/'
    png_dir = "./temp_dir/dcm_2_png/"

    # cv2.imwrite returns False instead of raising when the target directory
    # does not exist, so create the output directories before writing.
    os.makedirs(png_dir, exist_ok=True)

    # Read the DICOM metadata (tags) of every slice.
    slices = load_patient(dicom_dir)

    # In-plane spacing from the first slice, extended in place with the slice distance.
    pixel_spacing = slices[0].PixelSpacing
    pixel_spacing.append(slices[0].SliceThickness)
    print('The dicom spacing : ', pixel_spacing)

    # Pixel values of the whole series.
    image = get_pixels_hu_by_simpleitk(dicom_dir)
    # Bring volumes of different resolution to a common 1mm:1mm:1mm scale.
    image = rescale_patient_images(image, pixel_spacing, 1.00)
    for i in tqdm(range(image.shape[0])):
        img_path = png_dir + "img_" + str(i).rjust(4, '0') + "_i.png"

        # Map the slice to [0, 1], then store it as a grayscale PNG.
        org_img = normalize_hu(image[i])
        cv2.imwrite(img_path, org_img * 255)

    # Load the PNG slices written by the loop above.
    pngs = load_patient_images(png_dir, "*_i.png")
    # Manually annotated nodule position: coord_x, coord_y, coord_z.
    cube_img = get_cube_from_img(pngs, 272, 200, 134, 64)
    print(cube_img)
    save_cube_img('./temp_dir/chapter3_3dcnn_img_X.png', cube_img, 8, 8)

基於深度學習的CT影象肺結節自動檢測技術二——訓練資料處理

開發環境 Anaconda:jupyter notebook/pycharm pip install dicom # 用於讀取 dicom 圖片(version0.9.9) pip install SimpleItk # 讀

基於深度學習的CT影象肺結節自動檢測技術六—模型預測

#模型預測的相關功能 from chapter4 import get_unet from chapter5 import get_3dnnnet, stack_2dcube_to_3darray, prepare_image_for_net3D, MEAN_

基於深度學習的CT影象肺結節自動檢測技術五—3dcnn優化模型

import os import random from keras import layers from keras import backend as K from keras.layers import Input, Convolution3D, MaxP

基於深度學習的CT影象肺結節自動檢測技術一——資料預處理（歸一化，資料增強，資料標記）

開發環境 Anaconda:jupyter notebook /pycharm pip install SimpleItk # 讀取CT醫學影象 pip install tqdm # 可擴充套件的Python進度條，封裝

基於深度學習的CT影象肺結節自動檢測技術四—資料增強—定義神經網路並訓練

開發環境 jupyter notebook # -- coding: utf-8 -- #訓練影象分割網路(u-net)模型 import csv import glob import random import cv2 import numpy import

基於深度學習的CT影象肺結節自動檢測（系列放在一起）

PS 為了方便查詢，將SongpingWang的肺結節系列部落格放在一起。（剛好公司要我開始接手這一塊）感謝大神具體連結： 0 ：https://blog.csdn.net/wsp_1138886114/article/details/81840891 1 ：https://blog.

學習筆記之——基於深度學習的影象超解析度重構

最近開展影象超解析度（ Image Super Resolution）方面的研究，做了一些列的調研，並結合本人的理解總結成本博文~（本博文僅用於本人的學習筆記，不做商業用途）本博文涉及的paper已經打包，供各位看客下載哈~h

基於深度學習的影象檢索 image retrieval based on deep learning （code ，程式碼）

本次程式碼分享主要是用的caffe框架，至於caffe框架的安裝過程不再說明。程式碼修改自“cross weights”的一篇2016年的文章，但是名字忘記了，誰記得，提醒我下。一、環境要求 1、python &nb

基於深度學習的影象質量排序

國內外各大網際網路公司（比如騰訊、阿里和Yelp）的線上廣告業務都在關注展示什麼樣的影象能吸引更多點選。在美團，商家的首圖是由商家或運營人工指定的，如何選擇首圖才能更好地吸引使用者呢？影象質量排序演算法目標就是做到自動選擇更優質的首圖，以吸引使用者點選。傳統的影象質量排序方法主要從美學角度進行

基於深度學習的影象語義分割技術概述之4常用方法 5.4未來研究方向

https://blog.csdn.net/u014593748/article/details/72794459 本文為論文閱讀筆記，不當之處，敬請指正。 A Review on Deep Learning Techniques Applied to Semantic Segmen

基於深度學習的影象修復—心中無碼

一、前言影象修復在應用上非常吸引人，通常設計師需要使用 Photoshop 根據影象周圍修復空缺部分。這一過程非常耗時和細緻，因此很早就有研究嘗試使用機器學習模型自動化這一過程。這篇文章介紹了 DeepCreamPy 專案，它可以自動修復漫畫影象中的空缺部分和馬賽克。該專案使用部分卷

基於深度學習的影象語義分割演算法綜述（截止20180715）

這篇文章講述卷積神經網路在影象語義分割（semantic image segmentation）的應用。影象分割這項計算機視覺任務需要判定一張圖片中特定區域的所屬類別。這個影象裡有什麼？它在影象中哪個位置？更具體地說，影象語義分割的目標是將影象的每個畫素所

基於深度學習的影象分割總結

一、影象分割類別隨著深度學習的發展，在分割任務中出現了許多優秀的網路。根據實際分割應用任務的不同，可以大致將分割分為三個研究方向：語義分割、例項分割、全景分割。這三種分割在某種意義上是具有一定的聯絡的。語義分割：畫素級別的語義分割，對影象中的每個畫素都劃分出對應的

如何基於深度學習實現影象的智慧稽核

如何基於深度學習實現影象的智慧稽核背景美團每天有百萬級的圖片產生量，運營人員負責相關圖片的內容稽核，對涉及法律風險及不符合平臺規定的圖片進行刪除操作。由於圖片數量巨大，人工稽核耗時耗力且稽核能力有限。另外對於不同稽核人員來講，稽核標準難以統一且實時變化。所以有必要藉助機器實現智慧稽核

基於深度學習的影象壓縮

近年來，深度學習在計算機視覺領域已經佔據主導地位，不論是在影象識別還是超分辨重現上，深度學習已成為圖片研究的重要技術，但它們的能力並不僅限於這些任務；現在深度學習技術已進入圖片壓縮領域。下面就說說神經網路在影象壓縮領域的應用。當前主要圖片壓縮演算法說到影象壓縮演算法，目前市面上影響力比較

乾貨 | 美團如何基於深度學習實現影象的智慧稽核？

[1]H. Chen, S. S. Tsai, G. Schroth, D. M. Chen, R. Grzeszczuk, and B. Girod. “Robust text detection in natural images with edge-enhanced maximally stable e

基於深度學習的影象語義分析及其應用

本文轉自“火光搖曳”部落格：語義分析的一些方法(三)，主要論述了基於深度學習方法的影象語義分析，包括圖片分類、圖片搜尋、圖片標註（image2text、image2sentence），以及訓練深度神經網路的一些tricks，並介紹語義分析方法在騰訊廣點通上的實際應用。以下

基於深度學習的影象去噪暨SRMD論文閱讀筆記

最近一直在做基於卷積神經網路的影象去噪~感覺資料比較凌亂，本博文就是整理好經典的論文材料~ 同時本博文也結合了閱讀論文《Learning a Single Convolutional Super-Resolution Network for Multiple Degradations》時的心

基於深度學習的影象去噪（論文總結）

2015 深度學習、自編碼器、低照度影象增強 Lore, Kin Gwn, Adedotun Akintayo, and Soumik Sarkar. "LLNet: A Deep Autoencoder Approach to Natural Low-light Image Enhancement." ar

Amazon Rekognition常見問題_基於深度學習的影象分析服務問題

問：什麼是 Amazon Rekognition？ Amazon Rekognition 作為一項服務，能夠讓您輕鬆地將功能強大的視覺化分析新增到應用程式。藉助 Rekognition Image，您可以輕鬆構建功能強大的應用程式來搜尋、驗證和組織數百萬個影象

基於深度學習的CT影象肺結節自動檢測技術二——訓練資料處理

一、訓練資料處理

讀取dicom 圖片——提取畫素值（範圍約 -4000 ~ 4000）

將dicom影象縮放歸一化（1mm×1mm×1mm 的尺度）

切割為小cube並平鋪儲存為png

畫素值（-4000 ~ 4000）歸一化—>讀取影象：3維cube影象（儲存為2維影象方便檢視）

相關推薦