TensorFlow CNN Example: Image Classification
阿新 · Published 2019-02-05
import numpy as np
from scipy.misc import imread, imresize
import glob
import matplotlib.pyplot as plt
import os
import tensorflow as tf
from tensorflow.python.framework import ops
ops.reset_default_graph()
from tensorflow.python.framework.graph_util import convert_variables_to_constants
def read_image(path):  # read the training images
    imgs = []
    labels = []
    # one sub-folder per class under `path`
    cate = [path + x for x in os.listdir(path)]  # build the absolute paths
    for idx, folder in enumerate(cate):
        print(idx, folder)
        for im in glob.glob(folder + '/*.png'):  # glob finds the image files
            # print('reading the images: %s' % im)
            img = imread(im)
            img = imresize(img, (w, h))  # w and h are set in __main__ before this is called
            imgs.append(img)
            labels.append(idx)
    return np.asarray(imgs), np.asarray(labels, np.int32)
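# Note: read_image assumes one sub-folder per class under `path`; the folder's
# enumeration index becomes the integer label. scipy.misc.imread/imresize were
# removed in SciPy >= 1.2, so on a newer SciPy a Pillow-based drop-in sketch
# (assuming RGBA PNGs, to match c = 4 below) could replace the two calls above:
#
#   from PIL import Image
#   img = np.asarray(Image.open(im).convert('RGBA').resize((h, w)))
#
# PIL's resize takes (width, height), so (h, w) here yields an array of shape
# (w, h, 4), matching the x_input placeholder defined in __main__.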
# Network parameter setup
def cnn_param_set():
    # The weights are shared with my_conv_net() through module-level names,
    # so they must be declared global here; as locals they would be
    # discarded when this function returns.
    global conv1_weight, conv1_bias, conv2_weight, conv2_bias
    global full1_weight, full1_bias, full2_weight, full2_bias
    conv1_weight = tf.Variable(tf.truncated_normal([3, 3, num_channels, conv1_features],
                                                   stddev=0.1, dtype=tf.float32), name='conv1_weight')
    conv1_bias = tf.Variable(tf.zeros([conv1_features], dtype=tf.float32), name='conv1_bias')
    conv2_weight = tf.Variable(tf.truncated_normal([3, 3, conv1_features, conv2_features],
                                                   stddev=0.1, dtype=tf.float32), name='conv2_weight')
    conv2_bias = tf.Variable(tf.zeros([conv2_features], dtype=tf.float32), name='conv2_bias')
    # fully connected layer variables
    resulting_width = image_width // (max_pool_size1 * max_pool_size2)
    resulting_height = image_height // (max_pool_size1 * max_pool_size2)
    full1_input_size = resulting_width * resulting_height * conv2_features
    print(resulting_width, resulting_height, full1_input_size)
    full1_weight = tf.Variable(tf.truncated_normal([full1_input_size, fully_connected_size1],
                                                   stddev=0.1, dtype=tf.float32), name='full1_weight')
    full1_bias = tf.Variable(tf.truncated_normal([fully_connected_size1], stddev=0.1, dtype=tf.float32),
                             name='full1_bias')
    full2_weight = tf.Variable(tf.truncated_normal([fully_connected_size1, target_size],
                                                   stddev=0.1, dtype=tf.float32), name='full2_weight')
    full2_bias = tf.Variable(tf.truncated_normal([target_size], stddev=0.1, dtype=tf.float32), name='full2_bias')
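# With the settings in __main__ (image_width = 32, image_height = 64, two 2x2
# max-pool layers, conv2_features = 64), the fully connected input size works
# out to (32 // 4) * (64 // 4) * 64 = 8 * 16 * 64 = 8192.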
def my_conv_net(input_data):
    # First Conv-ReLU-MaxPool layer
    conv1 = tf.nn.conv2d(input_data, conv1_weight, strides=[1, 1, 1, 1], padding='SAME', name='conv1')
    relu1 = tf.nn.relu(tf.nn.bias_add(conv1, conv1_bias))
    max_pool1 = tf.nn.max_pool(relu1, ksize=[1, max_pool_size1, max_pool_size1, 1],
                               strides=[1, max_pool_size1, max_pool_size1, 1], padding='SAME', name='max_pool1')
    print(max_pool1.shape)
    # Second Conv-ReLU-MaxPool layer
    conv2 = tf.nn.conv2d(max_pool1, conv2_weight, strides=[1, 1, 1, 1], padding='SAME', name='conv2')
    relu2 = tf.nn.relu(tf.nn.bias_add(conv2, conv2_bias))
    max_pool2 = tf.nn.max_pool(relu2, ksize=[1, max_pool_size2, max_pool_size2, 1],
                               strides=[1, max_pool_size2, max_pool_size2, 1], padding='SAME', name='max_pool2')
    print(max_pool2.shape)
    # Flatten the output into a (batch, N) tensor for the fully connected layers
    final_conv_shape = max_pool2.get_shape().as_list()  # [None, 8, 16, 64] with the settings in __main__
    print(final_conv_shape)
    final_shape = final_conv_shape[1] * final_conv_shape[2] * final_conv_shape[3]
    flat_output = tf.reshape(max_pool2, [-1, final_shape])
    # First fully connected layer (matrix multiply + bias + ReLU)
    fully_connected1 = tf.nn.relu(tf.add(tf.matmul(flat_output, full1_weight), full1_bias),
                                  name='fully_connected1')
    print('full1: ' + str(fully_connected1))
    # Second fully connected layer produces the class logits
    final_model_output = tf.add(tf.matmul(fully_connected1, full2_weight), full2_bias, name='final_model_output')
    print(final_model_output)
    return final_model_output
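# Shape walkthrough with the settings in __main__ (batch dimension is None at
# graph-construction time):
#   x_input    (None, 32, 64,  4)
#   max_pool1  (None, 16, 32, 32)
#   max_pool2  (None,  8, 16, 64)
#   flattened  (None, 8192)
#   fc1        (None, 512)
#   logits     (None, target_size)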
# Accuracy computation
def get_accuracy(logits, targets):
    batch_predictions = np.argmax(logits, axis=1)
    num_correct = np.sum(np.equal(batch_predictions, targets))
    return 100. * num_correct / batch_predictions.shape[0]
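# Quick sanity check of get_accuracy on made-up values: argmax of the three
# rows gives [1, 0, 1], so against targets [1, 1, 1] two of three predictions
# are correct and the expected accuracy is 66.67%.
_demo_logits = np.array([[0.1, 0.9], [0.8, 0.2], [0.3, 0.7]])
_demo_targets = np.array([1, 1, 1])
assert abs(get_accuracy(_demo_logits, _demo_targets) - 200.0 / 3) < 1e-6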
def train():
    # training
    import datetime
    # The histories are read later by loss_accuracy_plt(), so keep them global.
    global train_loss, train_acc, test_acc
    begin = datetime.datetime.now()
    train_loss = []
    train_acc = []
    test_acc = []
    for i in range(generations):
        rand_index = np.random.choice(len(x_train), size=batch_size)  # sample a random mini-batch
        rand_x = x_train[rand_index]  # shape (batch_size, w, h, c)
        rand_y = y_train[rand_index]
        train_dict = {x_input: rand_x, y_target: rand_y}
        sess.run(train_step, feed_dict=train_dict)
        temp_train_loss, temp_train_preds = sess.run([loss, prediction], feed_dict=train_dict)
        temp_train_acc = get_accuracy(temp_train_preds, rand_y)
        if i % eval_every == 0:
            eval_index = np.random.choice(len(x_val), size=evaluation_size)
            eval_x = x_val[eval_index]
            eval_y = y_val[eval_index]
            test_dict = {eval_input: eval_x, eval_target: eval_y}
            temp_test_loss = sess.run(loss_test, feed_dict=test_dict)
            test_preds = sess.run(test_prediction, feed_dict=test_dict)
            temp_test_acc = get_accuracy(test_preds, eval_y)
            # Record and print results
            train_loss.append(temp_train_loss)
            train_acc.append(temp_train_acc)
            test_acc.append(temp_test_acc)
            acc_and_loss = [(i + 1), temp_train_loss, temp_train_acc, temp_test_acc]
            acc_and_loss = [np.round(x, 2) for x in acc_and_loss]
            print('Generation # {}. Train Loss: {:.2f}. Train Acc (Test Acc): {:.2f} ({:.2f})'.format(*acc_and_loss))
            print('Generation # test Loss: ', temp_test_loss)
    end = datetime.datetime.now()
    print(end - begin)
def loss_accuracy_plt():
    # Matplotlib code to plot the loss and accuracies
    eval_indices = range(0, generations, eval_every)
    # Plot loss over time
    plt.plot(eval_indices, train_loss, 'k-')
    plt.title('Softmax Loss per Generation')
    plt.xlabel('Generation')
    plt.ylabel('Softmax Loss')
    plt.show()
    # Plot train and test accuracy
    plt.plot(eval_indices, train_acc, 'k-', label='Train Set Accuracy')
    plt.plot(eval_indices, test_acc, 'r--', label='Test Set Accuracy')
    plt.title('Train and Test Accuracy')
    plt.xlabel('Generation')
    plt.ylabel('Accuracy')
    plt.legend(loc='lower right')
    plt.show()
if __name__ == "__main__":
    path = u'F:/PycharmWorkspace/ipython/tensorflow/station_data/'
    # resize every image to 32x64
    w = 32
    h = 64
    c = 4
    # read the images
    data, label = read_image(path)
    # shuffle the images
    num_example = data.shape[0]
    print(num_example)
    print(label)
    print(set(label))
    arr = np.arange(num_example)
    np.random.shuffle(arr)
    data = data[arr]
    label = label[arr]
    # split the data into a training set and a validation set
    ratio = 0.8
    s = int(num_example * ratio)  # np.int is deprecated; the built-in int behaves the same here
    x_train = data[:s]
    y_train = label[:s]
    x_val = data[s:]
    y_val = label[s:]
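    # An alternative split, as a sketch assuming scikit-learn is available:
    # stratify=label keeps the class proportions equal in both sets, which
    # the plain shuffle-and-slice above does not guarantee.
    #
    #   from sklearn.model_selection import train_test_split
    #   x_train, x_val, y_train, y_val = train_test_split(
    #       data, label, train_size=ratio, stratify=label, random_state=0)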
    # model hyperparameters
    generations = 1000
    batch_size = 200
    evaluation_size = 500
    image_width = w
    image_height = h
    num_channels = 4  # RGBA PNGs have 4 channels (a greyscale image would have 1)
    target_size = len(set(label))
    print(target_size)
    learning_rate = 0.001
    eval_every = 5
    conv1_features = 32  # number of conv1 filters
    conv2_features = 64  # number of conv2 filters
    max_pool_size1 = 2  # NxN window for 1st max pool layer
    max_pool_size2 = 2  # NxN window for 2nd max pool layer
    max_pool_size3 = 2  # NxN window for a 3rd max pool layer (currently unused)
    fully_connected_size1 = 512
    # CNN placeholders
    x_input_shape = (None, w, h, c)
    x_input = tf.placeholder(tf.float32, shape=x_input_shape, name='x_input')
    y_target = tf.placeholder(tf.int32, shape=[None, ], name='y_target')
    print(x_input)
    print(y_target)
    eval_input_shape = (None, w, h, c)
    eval_input = tf.placeholder(tf.float32, shape=eval_input_shape, name='eval_input')
    eval_target = tf.placeholder(tf.int32, shape=[None, ], name='eval_target')
    # set up the network parameters
    cnn_param_set()
    # network model: both calls reuse the same weight variables
    model_output = my_conv_net(x_input)
    test_model_output = my_conv_net(eval_input)
    # loss functions (the sparse variant expects integer class indices, not one-hot labels)
    loss = tf.reduce_mean(tf.nn.sparse_softmax_cross_entropy_with_logits(
        logits=model_output, labels=y_target), name='loss')
    loss_test = tf.reduce_mean(tf.nn.sparse_softmax_cross_entropy_with_logits(
        logits=test_model_output, labels=eval_target))
    # predictions
    prediction = tf.nn.softmax(model_output, name="softmax")
    print(prediction)
    prediction_labels = tf.argmax(prediction, axis=1, name='output')
    print(prediction_labels)
    test_prediction = tf.nn.softmax(test_model_output)
    # Create an optimizer
    my_optimizer = tf.train.AdamOptimizer(learning_rate)
    train_step = my_optimizer.minimize(loss)
    # Create the session and initialize variables
    sess = tf.Session()
    init = tf.global_variables_initializer()
    sess.run(init)
    # train
    train()
    # plot how the loss and the accuracy evolve
    loss_accuracy_plt()
    # save the trained model; "softmax" is the name of the graph's final output node
    graph = convert_variables_to_constants(sess, sess.graph_def, ["softmax"])
    tf.train.write_graph(graph, '.', 'graph/graph_train.pb', as_text=False)
    sess.close()
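# Reloading the frozen graph later for inference, as a minimal sketch: the
# tensor names follow from the graph above ('x_input:0' feeds the network,
# 'softmax:0' is the class-probability output); `some_batch` is a hypothetical
# float32 array of shape (n, 32, 64, 4).
#
#   with tf.gfile.GFile('graph/graph_train.pb', 'rb') as f:
#       graph_def = tf.GraphDef()
#       graph_def.ParseFromString(f.read())
#   with tf.Graph().as_default() as g:
#       tf.import_graph_def(graph_def, name='')
#       with tf.Session(graph=g) as infer_sess:
#           probs = infer_sess.run('softmax:0', feed_dict={'x_input:0': some_batch})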