[TensorFlow Deep Learning, Advanced] Hands-On 2: Using a CNN to Recognize and Crack Digit CAPTCHAs

Reference blog
Small modifications were made on top of it.
The CNN part follows the content of Hands-On 6 in our introductory series; if CNNs are still unclear to you, it is worth going back and reviewing that post first.
Dataset for this post (a sketch for generating a similar dataset is given below).
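The original download link for the dataset is not reproduced here. For reference, the training script below only assumes a folder of 60x160 captcha images whose file names start with the 4-digit answer (e.g. 0296.png). The following is a minimal sketch for generating such a dataset with the third-party captcha package; it is an assumption about the data format, not necessarily how the original dataset was produced.

# Hypothetical dataset generator (not from the original post): writes 4-digit
# captcha images whose file names start with their label, which is what the
# training script's name2label(e[0:CAPTCHA_LEN]) call expects.
import os
import random
from captcha.image import ImageCaptcha

OUT_DIR = './1CNN/Number_app/datas/train/'      # path used by the training script
os.makedirs(OUT_DIR, exist_ok=True)
generator = ImageCaptcha(width=160, height=60)  # matches CAPTCHA_IMAGE_WIDHT / HEIGHT

for _ in range(10000):                          # number of samples is an assumption
    text = ''.join(random.choice('0123456789') for _ in range(4))
    # e.g. '0296.png'; a repeated label simply overwrites the earlier sample
    generator.write(text, os.path.join(OUT_DIR, text + '.png'))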

Code

import os
os.environ["KMP_DUPLICATE_LIB_OK"]="TRUE"

import tensorflow as tf
import numpy as np
from PIL import Image
import random
import time

# Path where the captcha images are stored
CAPTCHA_IMAGE_PATH = './1CNN/Number_app/datas/train/'
# Width of the captcha images
CAPTCHA_IMAGE_WIDHT = 160
# Height of the captcha images
CAPTCHA_IMAGE_HEIGHT = 60
CHAR_SET_LEN = 10
CAPTCHA_LEN = 4
# 80% of the captcha images go into the training set
TRAIN_IMAGE_PERCENT = 0.8
# File names of the captcha images used for training
TRAINING_IMAGE_NAME = []
# File names of the captcha images used for validation
VALIDATION_IMAGE_NAME = []
# Path where the trained model is saved
MODEL_SAVE_PATH = './1CNN/Number_app/models/'

def get_image_file_name(imgPath=CAPTCHA_IMAGE_PATH):
    fileName = []
    for filePath in os.listdir(imgPath):
        captcha_name = filePath.split('/')[-1]
        fileName.append(captcha_name)
    return fileName

# Convert a captcha string into the 40-dimensional label vector used for training.
# For example, the captcha '0296' corresponds to the label
# [1 0 0 0 0 0 0 0 0 0
#  0 0 1 0 0 0 0 0 0 0
#  0 0 0 0 0 0 0 0 0 1
#  0 0 0 0 0 0 1 0 0 0]
def name2label(name):
    label = np.zeros(CAPTCHA_LEN * CHAR_SET_LEN)
    for i, c in enumerate(name):
        idx = i * CHAR_SET_LEN + ord(c) - ord('0')
        label[idx] = 1
    return label

# Load the captcha image data together with the labels
def get_datas_and_labels(fileName, filePath=CAPTCHA_IMAGE_PATH):
    train_images = []
    train_labels = []
    for e in fileName:
        pathName = os.path.join(filePath, e)
        img = Image.open(pathName)
        # Convert to grayscale
        img = img.convert("L")
        image_array = np.array(img)
        image_data = image_array / 255
        image_label = name2label(e[0:CAPTCHA_LEN])
        train_images.append(image_data)
        train_labels.append(image_label)
    train_images = np.array(train_images)
    train_labels = np.array(train_labels)
    return train_images, train_labels

# Input image data
x = tf.placeholder("float", shape=[None, 60, 160], name="x")
# Training label data
y_ = tf.placeholder("float", shape=[None, 40], name="y_")
x_image = tf.reshape(x, [-1, 60, 160, 1])

# Layer 1: convolution
# Filter size 5*5, input depth 1, output depth 16
conv1_weights = tf.get_variable("conv1_weights", [5, 5, 1, 16], initializer=tf.truncated_normal_initializer(stddev=0.1))
conv1_biases = tf.get_variable("conv1_biases", [16], initializer=tf.constant_initializer(0.0))
# Stride 1, zero ('SAME') padding
conv1 = tf.nn.conv2d(x_image, conv1_weights, strides=[1, 1, 1, 1], padding='SAME')
# ReLU activation
relu1 = tf.nn.relu(tf.nn.bias_add(conv1, conv1_biases))

# Layer 2: max pooling, 2*2 window, stride 2, zero padding
pool1 = tf.nn.max_pool(relu1, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

# Layer 3: convolution
# Filter size 5*5, input depth 16, output depth 32
conv2_weights = tf.get_variable("conv2_weights", [5, 5, 16, 32], initializer=tf.truncated_normal_initializer(stddev=0.1))
conv2_biases = tf.get_variable("conv2_biases", [32], initializer=tf.constant_initializer(0.0))
conv2 = tf.nn.conv2d(pool1, conv2_weights, strides=[1, 1, 1, 1], padding='SAME')
relu2 = tf.nn.relu(tf.nn.bias_add(conv2, conv2_biases))

# Layer 4: max pooling, 2*2 window, stride 2, zero padding
pool2 = tf.nn.max_pool(relu2, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

# Layer 5: convolution
# Filter size 5*5, input depth 32, output depth 64
conv3_weights = tf.get_variable("conv3_weights", [5, 5, 32, 64], initializer=tf.truncated_normal_initializer(stddev=0.1))
conv3_biases = tf.get_variable("conv3_biases", [64], initializer=tf.constant_initializer(0.0))
conv3 = tf.nn.conv2d(pool2, conv3_weights, strides=[1, 1, 1, 1], padding='SAME')
relu3 = tf.nn.relu(tf.nn.bias_add(conv3, conv3_biases))

# Layer 6: max pooling, 2*2 window, stride 2, zero padding
pool3 = tf.nn.max_pool(relu3, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME')

# Layer 7: fully connected
# 8*20*64 = 10240: flatten the previous layer's output into a feature vector
fc1_weights = tf.get_variable("fc1_weights", [8 * 20 * 64, 1024], initializer=tf.truncated_normal_initializer(stddev=0.1))
fc1_baises = tf.get_variable("fc1_baises", [1024], initializer=tf.constant_initializer(0.1))
pool3_vector = tf.reshape(pool3, [-1, 8 * 20 * 64])
fc1 = tf.nn.relu(tf.matmul(pool3_vector, fc1_weights) + fc1_baises)

# Dropout layer to reduce overfitting
keep_prob = tf.placeholder(tf.float32, name="keep_prob")
fc1_dropout = tf.nn.dropout(fc1, keep_prob)

# Layer 8: fully connected
# 1024 hidden units, 40 output units (4 digits * 10 classes)
fc2_weights = tf.get_variable("fc2_weights", [1024, 40], initializer=tf.truncated_normal_initializer(stddev=0.1))
fc2_biases = tf.get_variable("fc2_biases", [40], initializer=tf.constant_initializer(0.1))
fc2 = tf.matmul(fc1_dropout, fc2_weights) + fc2_biases

loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(labels=y_, logits=fc2))

predict = tf.reshape(fc2, [-1, CAPTCHA_LEN, CHAR_SET_LEN], name='predict')
labels = tf.reshape(y_, [-1, CAPTCHA_LEN, CHAR_SET_LEN], name='labels')
# Prediction. Note the name of predict_max_idx; it is needed when testing the model.
predict_max_idx = tf.argmax(predict, axis=2, name='predict_max_idx')
labels_max_idx = tf.argmax(labels, axis=2, name='labels_max_idx')
predict_correct_vec = tf.equal(predict_max_idx, labels_max_idx)
accuracy = tf.reduce_mean(tf.cast(predict_correct_vec, tf.float32))

# Training op
train_step = tf.train.AdamOptimizer(0.002).minimize(loss)

if __name__ == '__main__':
    image_filename_list = get_image_file_name(CAPTCHA_IMAGE_PATH)
    np.random.shuffle(image_filename_list)  # on Windows this shuffle must not be omitted
    lens = len(image_filename_list)
    seq = 0.8
    lens1 = int(seq * lens)
    train_filename_list = image_filename_list[:lens1]
    test_filename_list = image_filename_list[lens1:]
    print(lens, lens1)
    train_images, train_labels = get_datas_and_labels(fileName=train_filename_list)
    print(train_filename_list[0], train_images.shape,
          np.argmax(train_labels[0, :10]), np.argmax(train_labels[0, 10:20]),
          np.argmax(train_labels[0, 20:30]), np.argmax(train_labels[0, 30:]))
    with tf.Session() as sess:
        # Start training
        srun = sess.run
        srun(tf.global_variables_initializer())
        saver = tf.train.Saver()
        for i in range(3001):
            # 7960 is the training-set size used here; adjust it to your own data
            start_step = i * 100 % 7960
            stop_step = start_step + 100
            batch_x, batch_y = train_images[start_step:stop_step], train_labels[start_step:stop_step]
            # Keep 80% of activations (dropout) during training
            srun(train_step, feed_dict={x: batch_x, y_: batch_y, keep_prob: 0.8})
            if i % 10 == 0:
                loss_val = srun(loss, {x: batch_x, y_: batch_y, keep_prob: 1.0})
                acc_val = sess.run(accuracy, feed_dict={x: train_images[:200], y_: train_labels[:200], keep_prob: 1.0})
                print(i, loss_val, acc_val)
                if acc_val > 0.6:
                    saver.save(sess, MODEL_SAVE_PATH + "crack_captcha.model", global_step=i)
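As a side note on the 8 * 20 * 64 input size of the first fully connected layer: with 'SAME' padding and stride 2, each of the three max-pool layers halves the spatial dimensions (rounding up), so the 60x160 input shrinks to 8x20 with 64 channels. A quick check:

# Sanity check of the fully connected layer's input size
import math

h, w = 60, 160
for _ in range(3):                  # three 2x2 max-pool layers with stride 2
    h, w = math.ceil(h / 2), math.ceil(w / 2)
print(h, w, h * w * 64)             # 8 20 10240 -> matches [8 * 20 * 64, 1024]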

Run results

0 7.2514677 0.0975
10 0.3490238 0.09375
20 0.32853785 0.11125
30 0.3260678 0.0975
...
150 0.32142633 0.14
160 0.3182468 0.145
170 0.30834803 0.24
180 0.2962727 0.3125
190 0.29101092 0.33
200 0.2805277 0.3525
210 0.26561457 0.385
220 0.2575577 0.40375
230 0.24210992 0.43375
240 0.23269977 0.47625
250 0.22842664 0.4925
260 0.21917553 0.5425
270 0.22002003 0.52875
280 0.20558219 0.54375
290 0.21356806 0.54125
300 0.2039287 0.56
310 0.20335045 0.55625
320 0.19401187 0.5975
330 0.19049801 0.65625
...
1480 0.0026436544 0.9925
1490 0.0020101557 0.99375
...
1680 0.0016069501 1.0
1690 0.0010696264 0.99875
1700 0.0016226814 0.99125
1710 0.0021925105 0.99375
1720 0.0012222779 0.99875

Result analysis
After roughly 1,000 training steps, the accuracy on 200 training-set samples reaches 99%, which shows how well this network architecture works; on this basis the model can be used to crack digit CAPTCHAs (a minimal inference sketch follows).
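The following inference sketch is not part of the original post. It assumes a checkpoint was saved under MODEL_SAVE_PATH by the training script above and that the test image follows the same 60x160, label-in-filename conventions; the test image path is hypothetical. It restores the graph and looks up the tensors by the names defined above (x, keep_prob, predict_max_idx).

# Minimal inference sketch: restore the latest checkpoint and decode one captcha
import numpy as np
import tensorflow as tf
from PIL import Image

MODEL_SAVE_PATH = './1CNN/Number_app/models/'
IMAGE_PATH = './1CNN/Number_app/datas/test/0296.png'    # hypothetical test image

with tf.Session() as sess:
    # Restore the newest checkpoint saved by the training script
    ckpt = tf.train.latest_checkpoint(MODEL_SAVE_PATH)
    saver = tf.train.import_meta_graph(ckpt + '.meta')
    saver.restore(sess, ckpt)
    graph = tf.get_default_graph()
    x = graph.get_tensor_by_name('x:0')
    keep_prob = graph.get_tensor_by_name('keep_prob:0')
    predict_max_idx = graph.get_tensor_by_name('predict_max_idx:0')

    # Same preprocessing as training: grayscale, scaled to [0, 1]
    img = Image.open(IMAGE_PATH).convert('L')
    image_data = np.array(img) / 255
    idx = sess.run(predict_max_idx,
                   feed_dict={x: image_data[np.newaxis, :, :], keep_prob: 1.0})
    print('predicted:', ''.join(str(d) for d in idx[0]))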