08-人臉識別-FaceNet-classify.py代碼閱讀（說明見注釋）

本文轉載自查看原文 2018-04-19 22:43 2487 人臉識別-face_recognition/ numpy/ Python/ TensorFlow
"""An example of how to use your own dataset to train a classifier that recognizes people.
"""
# MIT License
# 
# Copyright (c) 2016 David Sandberg
# 
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
# 
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
# 
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.

# @ 調用格式：
# @
# @ 訓練模型記住人臉（不是訓練網絡，網絡在這之前已經先訓練好了）。
# @ ../lfw/ 是lfw數據集經過 mtcnn 截取以后的結果。否則會影響效果（去除數據集中的人臉外部干擾）
# @     python classifier.py TRAIN ../lfw/ 20170511-185253/ train_20180419_2048.pkl 
# @
# @ 測試模型記住人臉的結果。（../data 是測試用的圖的路徑。）
# @     python classifier.py CLASSIFY ../data/ 20170511-185253/ train_20180419_2048.pkl 



from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import tensorflow as tf
import numpy as np
import argparse
import facenet
import os
import sys
import math
import pickle
from sklearn.svm import SVC

# @ args內中參數見函數 parse_arguments
def main(args):
	# @ 聲明一個計算圖，都這么寫，沒有就是默認一個。
    with tf.Graph().as_default():
		# @ 聲明一個 Session
        with tf.Session() as sess:
		
			# @ Part I
			# @ 這部分是計算人臉的 embedding 特征。費時。 
			# @ 
			
            # @ 加隨機數seed，調用np.random.random()的結果都會相同。
            np.random.seed(seed=args.seed)
            
            if args.use_split_dataset:
                dataset_tmp = facenet.get_dataset(args.data_dir)
                train_set, test_set = split_dataset(dataset_tmp, args.min_nrof_images_per_class, args.nrof_train_images_per_class)
                if (args.mode=='TRAIN'):
                    dataset = train_set
                elif (args.mode=='CLASSIFY'):
                    dataset = test_set
            else:
                dataset = facenet.get_dataset(args.data_dir)

            # Check that there are at least one training image per class
			# @ cls.image_paths 是每張圖的路徑，包含文件名。
            for cls in dataset:
                assert(len(cls.image_paths)>0, 'There must be at least one image for each class in the dataset')            

            # @ 分離出圖片路徑名paths，和類型labels（人臉所屬人名）
            paths, labels = facenet.get_image_paths_and_labels(dataset)
            
            print('Number of classes: %d' % len(dataset))
            print('Number of images: %d' % len(paths))
            
            # Load the model
            # @ 這里加的 model 使用於生成人臉的 embedding 特征的網絡。
			# @ 這個網絡是事先已經生成好的。
			# @ 網絡可以根據運行的平台，設計成不同大小。比如基於GoogleNet/AlexNet等
			print('Loading feature extraction model')
            facenet.load_model(args.model)
            
            # Get input and output tensors
			# @ TensorFlow的參數准備。embeddings 是網絡的輸出，是后續分類的輸入。
            images_placeholder = tf.get_default_graph().get_tensor_by_name("input:0")
            embeddings = tf.get_default_graph().get_tensor_by_name("embeddings:0")
            phase_train_placeholder = tf.get_default_graph().get_tensor_by_name("phase_train:0")
            embedding_size = embeddings.get_shape()[1]
            
            # Run forward pass to calculate embeddings
            print('Calculating features for images')
            nrof_images = len(paths) # @ 圖片總數
            nrof_batches_per_epoch = int(math.ceil(1.0*nrof_images / args.batch_size))
            emb_array = np.zeros((nrof_images, embedding_size))
            for i in range(nrof_batches_per_epoch):
                start_index = i*args.batch_size
                end_index = min((i+1)*args.batch_size, nrof_images)
                paths_batch = paths[start_index:end_index]
                images = facenet.load_data(paths_batch, False, False, args.image_size)
                feed_dict = { images_placeholder:images, phase_train_placeholder:False }
                emb_array[start_index:end_index,:] = sess.run(embeddings, feed_dict=feed_dict)
            
			# @ emb_array 是 embedding 結果。一個 embedding 有 18 維。
			# @ 接下來就是用機器學習的方法分類。
            classifier_filename_exp = os.path.expanduser(args.classifier_filename)

			# @ Part II 也較費時。
			# @ 這部分是訓練分類人臉的機器學習模型，這里使用的SVC，是SVM的一種。
			# @ 若是 CLASSIFY ，則是加載訓練結果，建立 SVC 分類器。
			
            if (args.mode=='TRAIN'):
                # Train classifier
				# @ SVC是SVM的一種Type，是用來的做分類的；同樣還有SVR，是SVM的另一種Type，是用來的做回歸的。
                print('Training classifier')
                model = SVC(kernel='linear', probability=True)
                model.fit(emb_array, labels) # @ 訓練過程
            
				# @ 訓練結束，保存數據
                # Create a list of class names
                class_names = [ cls.name.replace('_', ' ') for cls in dataset]

                # Saving classifier model
                with open(classifier_filename_exp, 'wb') as outfile:
                    pickle.dump((model, class_names), outfile)
                print('Saved classifier model to file "%s"' % classifier_filename_exp)
                
            elif (args.mode=='CLASSIFY'):
                # Classify images
                print('Testing classifier')
				# @ 加載數據，建立分類器
                with open(classifier_filename_exp, 'rb') as infile:
                    (model, class_names) = pickle.load(infile)

                print('Loaded classifier model from file "%s"' % classifier_filename_exp)

				# @ 預測，標簽結果應該是 one_hot 的。
                predictions = model.predict_proba(emb_array)
                best_class_indices = np.argmax(predictions, axis=1) # @ 輸出每列最大的序號。
                best_class_probabilities = predictions[np.arange(len(best_class_indices)), best_class_indices]
                
                for i in range(len(best_class_indices)):
                    print('%4d  %s: %.3f' % (i, class_names[best_class_indices[i]], best_class_probabilities[i]))
                    
				# @ 評估結果。labels 是測試集的實際結果，best_class_indices是預測結果。
                accuracy = np.mean(np.equal(best_class_indices, labels))
                print('Accuracy: %.3f' % accuracy)
                
# @ 將數據集分成訓練集和測試集
def split_dataset(dataset, min_nrof_images_per_class, nrof_train_images_per_class):
    train_set = []
    test_set = []
    for cls in dataset:
        paths = cls.image_paths
        # Remove classes with less than min_nrof_images_per_class
        if len(paths)>=min_nrof_images_per_class:
            np.random.shuffle(paths)
            train_set.append(facenet.ImageClass(cls.name, paths[:nrof_train_images_per_class]))
            test_set.append(facenet.ImageClass(cls.name, paths[nrof_train_images_per_class:]))
    return train_set, test_set
	
# @ 命令行參數，使用的系統庫 argparse
# @ ** 寫法值得記住 **
def parse_arguments(argv):
    parser = argparse.ArgumentParser()
    
    parser.add_argument('mode', type=str, choices=['TRAIN', 'CLASSIFY'],
        help='Indicates if a new classifier should be trained or a classification ' + 
        'model should be used for classification', default='CLASSIFY')
    parser.add_argument('data_dir', type=str,
        help='Path to the data directory containing aligned LFW face patches.')
    parser.add_argument('model', type=str, 
        help='Could be either a directory containing the meta_file and ckpt_file or a model protobuf (.pb) file')
    parser.add_argument('classifier_filename', 
        help='Classifier model file name as a pickle (.pkl) file. ' + 
        'For training this is the output and for classification this is an input.')
    parser.add_argument('--use_split_dataset', 
        help='Indicates that the dataset specified by data_dir should be split into a training and test set. ' +  
        'Otherwise a separate test set can be specified using the test_data_dir option.', action='store_true')
    parser.add_argument('--test_data_dir', type=str,
        help='Path to the test data directory containing aligned images used for testing.')
    parser.add_argument('--batch_size', type=int,
        help='Number of images to process in a batch.', default=90)
    parser.add_argument('--image_size', type=int,
        help='Image size (height, width) in pixels.', default=160)
    parser.add_argument('--seed', type=int,
        help='Random seed.', default=666)
    parser.add_argument('--min_nrof_images_per_class', type=int,
        help='Only include classes with at least this number of images in the dataset', default=20)
    parser.add_argument('--nrof_train_images_per_class', type=int,
        help='Use this number of images from each class for training and the rest for testing', default=10)
    
    return parser.parse_args(argv)

# @ 主函數
# @ sys.argv[1:] 就是命令行輸入的 classify.py 后面的所有字符串，以空格分隔。
if __name__ == '__main__':
    main(parse_arguments(sys.argv[1:]))
免責聲明！

本站轉載的文章為個人學習借鑒使用，本站對版權不負任何法律責任。如果侵犯了您的隱私權益，請聯系本站郵箱yoyou2525@163.com刪除。
猜您在找 facenet 人臉識別（一）人臉識別FaceNet+TensorFlow FaceNet實現人臉檢測和識別 facenet 進行人臉識別測試 facenet 人臉識別（二）——創建人臉庫搭建人臉識別系統用 Google 的 FaceNet 做人臉識別---極客幫課程筆記 FaceNet---深度學習與人臉識別的二次結合 TensorFlow環境人臉識別 FaceNet 應用（一）驗證測試集【深度學習】使用MTCNN+FaceNet進行人臉識別第三十七節、人臉檢測MTCNN和人臉識別Facenet(附源碼)