im2rec.py的解讀以及python高階程式設計的一些知識點

阿新 • • 發佈：2019-01-07

1.mxnet 的im2rec.py註釋

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.

# -*- coding: utf-8 -*-
from __future__ import print_function
import os
import sys

curr_path = os.path.abspath(os.path.dirname(__file__))
sys.path.append(os.path.join(curr_path, "../python"))
import mxnet as mx
import random
import argparse
import cv2
import time
import traceback
from builtins import range

try:
    import multiprocessing
except ImportError:
    multiprocessing = None

# Generator that enumerates image files under a root folder, either only the
# top level or the whole directory tree.
def list_image(root, recursive, exts):
    """Yield ``(index, relative_path, label)`` for every image under ``root``.

    Args:
        root: Folder to scan.
        recursive: When true, walk the whole tree (following symlinks) and give
            each folder that contains at least one accepted file its own
            integer label, numbered in the order folders are first seen.
            When false, only files directly inside ``root`` are listed and
            every label is 0.
        exts: Container of accepted, lower-case extensions (with the dot).

    Yields:
        Tuples ``(index, path relative to root, label)``; ``index`` counts
        yielded files from 0.

    In recursive mode, once the walk is exhausted, one line per labelled
    folder (relative folder path and label, ordered by label) is printed.
    """
    index = 0

    if not recursive:
        # Flat mode: a single sorted directory listing, label is always 0.
        for name in sorted(os.listdir(root)):
            full = os.path.join(root, name)
            ext = os.path.splitext(name)[1].lower()  # compare case-insensitively
            if not (os.path.isfile(full) and (ext in exts)):
                continue
            yield (index, os.path.relpath(full, root), 0)
            index += 1
        return

    labels = {}  # folder path -> integer label
    for folder, subdirs, names in os.walk(root, followlinks=True):
        # Sorting in place makes the traversal (and therefore the label
        # numbering) deterministic; os.walk honours the reordered subdirs.
        subdirs.sort()
        names.sort()
        for name in names:
            full = os.path.join(folder, name)
            ext = os.path.splitext(name)[1].lower()
            if not (os.path.isfile(full) and (ext in exts)):
                continue
            # A folder gets the next free label the first time it yields a file.
            label = labels.setdefault(folder, len(labels))
            yield (index, os.path.relpath(full, root), label)
            index += 1

    # Report the folder -> label mapping, ordered by label value.
    for folder, label in sorted(labels.items(), key=lambda pair: pair[1]):
        print(os.path.relpath(folder, root), label)
# Write an image list to a .lst file.
def write_list(path_out, image_list):
    """Write ``image_list`` to ``path_out``, one tab-separated line per item.

    Each item is indexable as ``(index, path, label, ...)``. The output line
    is the index (``%d``), then every label value from position 2 onwards
    (``%f``), then the path, e.g. ``0<TAB>1.000000<TAB>cat/a.jpg``.

    Args:
        path_out: Destination file; opened in text mode and overwritten.
        image_list: Iterable of items as described above.
    """
    with open(path_out, 'w') as fout:
        for item in image_list:
            fields = ['%d' % item[0]]
            fields.extend('%f' % value for value in item[2:])
            # The path goes last and carries the line terminator.
            fields.append('%s\n' % item[1])
            fout.write('\t'.join(fields))

# Main routine for producing the .lst file(s).
def make_list(args):
    """Scan ``args.root`` and write one or more ``.lst`` files.

    Reads ``args.root``, ``args.recursive``, ``args.exts``, ``args.shuffle``,
    ``args.chunks``, ``args.train_ratio``, ``args.test_ratio`` and
    ``args.prefix``.

    The image list is split into ``args.chunks`` consecutive chunks; with more
    than one chunk the output names get a ``_<chunk index>`` suffix. For each
    chunk:

    * ``train_ratio == 1.0``: the whole chunk goes to ``<prefix>.lst``.
    * otherwise the chunk is cut, in order, into ``_test.lst`` (only when
      ``test_ratio`` is non-zero), ``_train.lst``, and ``_val.lst`` (only when
      the two ratios sum to less than 1.0).

    The cut positions are computed from the nominal chunk size rather than
    from the length of the chunk itself, so a shorter final chunk is cut at
    the same absolute positions as the full ones.
    """
    image_list = list(list_image(args.root, args.recursive, args.exts))

    if args.shuffle is True:
        # Fixed seed: the shuffled order is reproducible between runs.
        random.seed(100)
        random.shuffle(image_list)

    total = len(image_list)
    chunk_size = (total + args.chunks - 1) // args.chunks  # ceiling division

    for chunk_idx in range(args.chunks):
        begin = chunk_idx * chunk_size
        chunk = image_list[begin:begin + chunk_size]
        suffix = '_%d' % chunk_idx if args.chunks > 1 else ''
        base = args.prefix + suffix

        n_train = int(chunk_size * args.train_ratio)
        n_test = int(chunk_size * args.test_ratio)

        if args.train_ratio == 1.0:
            write_list(base + '.lst', chunk)
            continue

        if args.test_ratio:
            write_list(base + '_test.lst', chunk[:n_test])
        if args.train_ratio + args.test_ratio < 1.0:
            write_list(base + '_val.lst', chunk[n_test + n_train:])
        write_list(base + '_train.lst', chunk[n_test:n_test + n_train])

# Parse a .lst file lazily so its entries can be packed into a .rec file.
def read_list(path_in):
    """Yield the parsed entries of the ``.lst`` file at ``path_in``.

    Each line is split on tabs and every field is stripped. A valid line has
    at least three fields: an integer index first, the image path last, and
    one or more float label values in between.

    Yields:
        Lists of the form ``[index, path, label_0, label_1, ...]``.

    Lines with fewer than three fields, or whose index/labels cannot be
    converted, are reported with ``print`` and skipped.
    """
    with open(path_in) as fin:
        for raw in fin:
            fields = [part.strip() for part in raw.strip().split('\t')]
            n_fields = len(fields)
            if n_fields < 3:
                print('lst should at least has three parts, but only has %s parts for %s' %(n_fields, fields))
                continue
            try:
                index = int(fields[0])
                labels = [float(value) for value in fields[1:-1]]
            except Exception as e:
                print('Parsing lst met error for %s, detail: %s' %(fields, e))
                continue
            # Reorder to (index, path, labels...), matching the item layout
            # used by the rest of this file.
            yield [index, fields[-1]] + labels

# Encode one image: build a record header and pack it with the image payload.
def image_encode(args, i, item, q_out):
    """Encode one list entry and put the result on ``q_out``.

    Every return path puts a tuple ``(i, s, item)`` on ``q_out``, where ``s``
    is the packed record, or ``None`` when the image could not be read or
    packed (the error is printed, not raised).

    Args:
        args: Parsed options. Reads ``root``, ``pack_label``, ``pass_through``,
            ``color``, ``center_crop``, ``resize``, ``quality``, ``encoding``.
        i: Position of the entry in the input list; passed through unchanged.
        item: ``[index, relative_path, label, ...]`` as produced by
            ``read_list``.
        q_out: Queue-like object with a ``put`` method.
    """
    fullpath = os.path.join(args.root, item[1])

    # With --pack-label and more than one label value the whole label vector
    # is stored; otherwise only the first label value is used.
    if len(item) > 3 and args.pack_label:
        header = mx.recordio.IRHeader(0, item[2:], item[0], 0)
    else:
        header = mx.recordio.IRHeader(0, item[2], item[0], 0)

    if args.pass_through:
        # Store the file bytes as they are, without decoding the image.
        try:
            with open(fullpath, 'rb') as fin:
                img = fin.read()
            s = mx.recordio.pack(header, img)
            q_out.put((i, s, item))
        except Exception as e:
            traceback.print_exc()
            print('pack_img error:', item[1], e)
            q_out.put((i, None, item))
        return

    try:
        img = cv2.imread(fullpath, args.color)
    except Exception:
        # Not a bare ``except:`` so that KeyboardInterrupt / SystemExit still
        # propagate instead of being reported as an unreadable image.
        traceback.print_exc()
        print('imread error trying to load file: %s ' % fullpath)
        q_out.put((i, None, item))
        return
    if img is None:
        print('imread read blank (None) image for file: %s' % fullpath)
        q_out.put((i, None, item))
        return
    if args.center_crop:
        # Trim the longer of the first two axes symmetrically so both end up
        # with the length of the shorter one.
        if img.shape[0] > img.shape[1]:
            margin = (img.shape[0] - img.shape[1]) // 2
            img = img[margin:margin + img.shape[1], :]
        else:
            margin = (img.shape[1] - img.shape[0]) // 2
            img = img[:, margin:margin + img.shape[0]]
    if args.resize:
        # Per the --resize help text the shorter edge becomes args.resize and
        # the other edge is scaled by the same factor (integer division).
        # NOTE(review): assumes img.shape is (rows, cols, ...) and that
        # cv2.resize takes (width, height) -- confirm against OpenCV docs.
        if img.shape[0] > img.shape[1]:
            newsize = (args.resize, img.shape[0] * args.resize // img.shape[1])
        else:
            newsize = (img.shape[1] * args.resize // img.shape[0], args.resize)
        img = cv2.resize(img, newsize)

    try:
        s = mx.recordio.pack_img(header, img, quality=args.quality, img_fmt=args.encoding)
        q_out.put((i, s, item))
    except Exception as e:
        traceback.print_exc()
        print('pack_img error on file: %s' % fullpath, e)
        q_out.put((i, None, item))
        return

def read_worker(args, q_in, q_out):
    """Consume ``(i, item)`` tasks from ``q_in`` until a ``None`` arrives.

    Each task is handed to ``image_encode`` together with ``args`` and
    ``q_out``. A ``None`` taken from ``q_in`` is the stop signal and ends the
    loop.
    """
    task = q_in.get()
    while task is not None:
        index, entry = task
        image_encode(args, index, entry, q_out)
        task = q_in.get()

def write_worker(q_out, fname, working_dir):
    """Drain ``q_out`` and write the packed records in list order.

    The output files are ``<stem>.rec`` and ``<stem>.idx`` inside
    ``working_dir``, where ``<stem>`` is the base name of ``fname`` without
    its extension.

    Args:
        q_out: Queue delivering ``(i, s, item)`` tuples and finally ``None``
            as the end-of-input signal. ``s`` is the packed record or ``None``
            for an entry that failed to encode.
        fname: Path of the ``.lst`` file being converted.
        working_dir: Folder that receives the ``.rec`` / ``.idx`` files.

    Results can arrive in any order; they are held in a buffer keyed by ``i``
    and written strictly in increasing ``i``. Failed entries (``s is None``)
    are skipped but still counted. Progress is printed every 1000 entries.
    """
    pre_time = time.time()
    count = 0
    fname = os.path.basename(fname)
    stem = os.path.splitext(fname)[0]
    fname_rec = stem + '.rec'
    fname_idx = stem + '.idx'
    record = mx.recordio.MXIndexedRecordIO(os.path.join(working_dir, fname_idx),
                                           os.path.join(working_dir, fname_rec), 'w')
    buf = {}  # i -> (s, item) for results that arrived ahead of their turn
    more = True
    try:
        while more:
            deq = q_out.get()
            if deq is not None:
                i, s, item = deq
                buf[i] = (s, item)
            else:
                more = False
            # Flush every consecutive entry that is now available.
            while count in buf:
                s, item = buf[count]
                del buf[count]
                if s is not None:
                    record.write_idx(item[0], s)

                if count % 1000 == 0:
                    cur_time = time.time()
                    print('time:', cur_time - pre_time, ' count:', count)
                    pre_time = cur_time
                count += 1
    finally:
        # Close explicitly so the .rec/.idx files are finalized even if
        # writing fails, instead of relying on garbage collection.
        record.close()

def _str2bool(value):
    """Convert a command-line string such as ``True``/``false``/``1`` to bool.

    ``type=bool`` cannot be used with argparse for this: ``bool('False')`` is
    ``True`` because any non-empty string is truthy.

    Raises:
        argparse.ArgumentTypeError: if ``value`` is not a recognized spelling.
    """
    if isinstance(value, bool):
        return value
    text = str(value).strip().lower()
    if text in ('true', 't', 'yes', 'y', 'on', '1'):
        return True
    # The empty string is kept as False, which is what bool('') gave before.
    if text in ('false', 'f', 'no', 'n', 'off', '0', ''):
        return False
    raise argparse.ArgumentTypeError('expected a boolean value, got %r' % (value,))


def parse_args():
    """Parse the command line (``sys.argv``) and return the options namespace.

    Positional arguments are ``prefix`` and ``root``; both are converted to
    absolute paths before returning. Boolean options take an explicit value
    (for example ``--list True`` or ``--shuffle False``); accepted spellings
    are true/false, t/f, yes/no, y/n, on/off and 1/0, case-insensitively.
    Any other value is rejected with a usage error.

    Returns:
        argparse.Namespace with one attribute per option.
    """
    parser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter,
        description='Create an image list or \
        make a record database by reading from an image list')
    parser.add_argument('prefix', help='prefix of input/output lst and rec files.')
    parser.add_argument('root', help='path to folder containing images.')

    # Options used when building the .lst file(s).
    cgroup = parser.add_argument_group('Options for creating image lists')
    cgroup.add_argument('--list', type=_str2bool, default=False,
                        help='If this is set im2rec will create image list(s) by traversing root folder\
        and output to <prefix>.lst.\
        Otherwise im2rec will read <prefix>.lst and create a database at <prefix>.rec')
    cgroup.add_argument('--exts', nargs='+', default=['.jpeg', '.jpg'],
                        help='list of acceptable image extensions.')
    cgroup.add_argument('--chunks', type=int, default=1, help='number of chunks.')
    cgroup.add_argument('--train-ratio', type=float, default=1.0,
                        help='Ratio of images to use for training.')
    cgroup.add_argument('--test-ratio', type=float, default=0,
                        help='Ratio of images to use for testing.')
    cgroup.add_argument('--recursive', type=_str2bool, default=False,
                        help='If true recursively walk through subdirs and assign an unique label\
        to images in each folder. Otherwise only include images in the root folder\
        and give them label 0.')
    cgroup.add_argument('--shuffle', type=_str2bool, default=True, help='If this is set as True, \
        im2rec will randomize the image order in <prefix>.lst')

    # Options used when packing the .rec database.
    rgroup = parser.add_argument_group('Options for creating database')
    rgroup.add_argument('--pass-through', type=_str2bool, default=False,
                        help='whether to skip transformation and save image as is')
    rgroup.add_argument('--resize', type=int, default=0,
                        help='resize the shorter edge of image to the newsize, original images will\
        be packed by default.')
    rgroup.add_argument('--center-crop', type=_str2bool, default=False,
                        help='specify whether to crop the center image to make it rectangular.')
    rgroup.add_argument('--quality', type=int, default=95,
                        help='JPEG quality for encoding, 1-100; or PNG compression for encoding, 1-9')
    rgroup.add_argument('--num-thread', type=int, default=1,
                        help='number of thread to use for encoding. order of images will be different\
        from the input list if >1. the input list will be modified to match the\
        resulting order.')
    rgroup.add_argument('--color', type=int, default=1, choices=[-1, 0, 1],
                        help='specify the color mode of the loaded image.\
        1: Loads a color image. Any transparency of image will be neglected. It is the default flag.\
        0: Loads image in grayscale mode.\
        -1:Loads image as such including alpha channel.')
    rgroup.add_argument('--encoding', type=str, default='.jpg', choices=['.jpg', '.png'],
                        help='specify the encoding of the images.')
    rgroup.add_argument('--pack-label', type=_str2bool, default=False,
        help='Whether to also pack multi dimensional label in the record file')
    args = parser.parse_args()
    # Absolute paths keep later prefix matching independent of the current
    # working directory.
    args.prefix = os.path.abspath(args.prefix)
    args.root = os.path.abspath(args.root)
    return args

if __name__ == '__main__':
    # Script entry point. With --list the .lst file(s) are generated;
    # otherwise every "<prefix>*.lst" file found is packed into .rec/.idx.
    args = parse_args()
    if args.list:
        make_list(args)
    else:
        # The prefix may name a folder, or be a path prefix of the list files.
        if os.path.isdir(args.prefix):
            working_dir = args.prefix
        else:
            working_dir = os.path.dirname(args.prefix)
        files = [os.path.join(working_dir, fname) for fname in os.listdir(working_dir)
                    if os.path.isfile(os.path.join(working_dir, fname))]
        count = 0
        for fname in files:
            if fname.startswith(args.prefix) and fname.endswith('.lst'):
                print('Creating .rec file from', fname, 'in', working_dir)
                count += 1
                image_list = read_list(fname)
                # -- write_record -- #
                if args.num_thread > 1 and multiprocessing is not None:
                    # One bounded input queue per encoder process, and a
                    # single shared output queue feeding the writer process.
                    q_in = [multiprocessing.Queue(1024) for i in range(args.num_thread)]
                    q_out = multiprocessing.Queue(1024)
                    read_process = [multiprocessing.Process(target=read_worker, args=(args, q_in[i], q_out)) \
                                    for i in range(args.num_thread)]
                    for p in read_process:
                        p.start()
                    write_process = multiprocessing.Process(target=write_worker, args=(q_out, fname, working_dir))
                    write_process.start()

                    # Distribute the entries round-robin over the encoders.
                    for i, item in enumerate(image_list):
                        q_in[i % len(q_in)].put((i, item))
                    # A None per input queue tells each encoder to stop.
                    for q in q_in:
                        q.put(None)
                    for p in read_process:
                        p.join()

                    # All encoders are done: tell the writer to finish.
                    q_out.put(None)
                    write_process.join()
                else:
                    # This branch is also taken when --num-thread is 1, not
                    # only when multiprocessing could not be imported.
                    print('multiprocessing not available, fall back to single threaded encoding')
                    try:
                        import Queue as queue
                    except ImportError:
                        import queue
                    q_out = queue.Queue()
                    fname = os.path.basename(fname)
                    fname_rec = os.path.splitext(fname)[0] + '.rec'
                    fname_idx = os.path.splitext(fname)[0] + '.idx'
                    record = mx.recordio.MXIndexedRecordIO(os.path.join(working_dir, fname_idx),
                                                           os.path.join(working_dir, fname_rec), 'w')
                    cnt = 0
                    pre_time = time.time()
                    try:
                        for i, item in enumerate(image_list):
                            image_encode(args, i, item, q_out)
                            if q_out.empty():
                                continue
                            _, s, _ = q_out.get()
                            # image_encode reports a failed image as s=None;
                            # skip it, as write_worker does, rather than
                            # handing None to the record writer.
                            if s is not None:
                                record.write_idx(item[0], s)
                            if cnt % 1000 == 0:
                                cur_time = time.time()
                                print('time:', cur_time - pre_time, ' count:', cnt)
                                pre_time = cur_time
                            cnt += 1
                    finally:
                        # Finalize the .rec/.idx files even if encoding fails.
                        record.close()
        if not count:
            print('Did not find and list file with prefix %s'%args.prefix)

2.python的部分高階用法

2.1 生成器

語法：函式內部帶有yield。

生成器與普通函式的區別在於：呼叫生成器函式時並不會立刻執行函式體，而是回傳一個迭代器。每次對這個迭代器呼叫next()，函式會執行到下一個yield並產生一個值，然後暫停（凍結）；下一次呼叫next()時，從上次yield之後的程式碼繼續執行。for迴圈會自動完成這些next()呼叫，例如上面程式碼中的list_image和read_list。

具體的用法和解釋參見

2.2 lambda表示式

類似於C/C++中用#define定義的巨集函式：lambda是只包含一個表示式的匿名小函式，例如上面程式碼中的 key=lambda x: x[1]，表示按照每個元素的第二個值排序。

2.3 多執行緒

該部分還需要繼續學習，之後再更。

im2rec.py的解讀以及python高階程式設計的一些知識點

1.mxnet 的im2rec.py註釋 # Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOT

python高階程式設計讀書筆記（一）

python高階程式設計讀書筆記（一） python 高階程式設計讀書筆記，記錄一下基礎和高階用法 python2和python3相容處理使用sys模組使程式python2和python3相容 import sysver=sys.version_info#(ma

python高階程式設計上— GIL全域性直譯器和深淺拷貝

①GIL：全域性直譯器鎖 1）：python直譯器分為兩種，一種是C-python，另一種是JAVA-python 2）：python語言和GIL沒有關係。GIL的造成是由於使用C-python直譯器造成的。由於90年代電腦沒有並行的多核電腦，因此C-python直譯器沒有考慮多執行緒的問

【python高階程式設計】一、遍歷資料夾目錄

前言如何遍歷查找出某個資料夾內所有的子檔案呢？並且找出某個字尾的所有檔案 walk功能簡介 1.os.walk() 方法用於通過在目錄樹種遊走輸出在目錄中的檔名，向上或者向下。 2.walk()方法語法格式如下： os.walk(top，topdown=True，onerr

Python高階程式設計——裝飾器Decorator詳解（上篇）(絕對是我見過最詳細的的教程，沒有之一哦)

一、先從一種情況開始看起 1、裝飾器decorator的由來裝飾器的定義很是抽象，我們來看一個小例子。先定義一個簡單的函式： def myfunc(): print('我是函式myfunc') myfunc() #呼叫函式然後呢，我想看看

Python高階程式設計（五）XML解析

Python XML解析什麼是XML？ XML 指可擴充套件標記語言（eXtensible Markup Language）。你可以通過本站學習XML教程 XML 被設計用來傳輸和儲存資料。 XML是一套定義語義標記的規則，這些標記將文件分成許多部件並對這些部件加以標識。

Python高階程式設計（四）多執行緒

Python 多執行緒多執行緒類似於同時執行多個不同程式，多執行緒執行有如下優點：使用執行緒可以把佔據長時間的程式中的任務放到後臺去處理。使用者介面可以更加吸引人，這樣比如使用者點選了一個按鈕去觸發某些事件的處理，可以彈出一個進度條來顯示處理的進度程式的執

Python高階程式設計（三）資料庫

python操作mysql資料庫 Python 標準資料庫介面為 Python DB-API，Python DB-API為開發人員提供了資料庫應用程式設計介面。 Python 資料庫介面支援非常多的資料庫，你可以選擇適合你專案的資料庫： GadFly mSQL

Python高階程式設計（二）正則表示式

Python正則表示式正則表示式是一個特殊的字元序列，它能幫助你方便的檢查一個字串是否與某種模式匹配。 Python 自1.5版本起增加了re 模組，它提供 Perl 風格的正則表示式模式。 re 模組使 Python 語言擁有全部的正則表示式功能。 compile 函式根據一個

Python高階程式設計-多執行緒

https://www.cnblogs.com/z-joshua/p/6409362.html (一)程序執行緒概述：很多同學都聽說過，現代作業系統比如Mac OS X，UNIX，Linux，Windows等，都是支援“多工”的作業系統。什麼叫“多工”呢？簡單地說，

Python高階程式設計——裝飾器Decorator超詳細講解！

裝飾器decorator，是python語言的重要特性，上面一章節詳細講解了python裝飾器與python閉包的下篇內容，主要講解了什麼是python閉包，python閉包與裝飾器之間到底有什麼區別和聯絡。本文將介紹裝飾器系列文章補充篇，詳細介紹巢狀裝飾器的各部分類容，主要包括巢狀裝飾器的定義，執

Python高階程式設計之上下文管理器

上下文管理器上下文管理器與裝飾器類似，它們都是包裝其他程式碼的工具。但裝飾器用於包裝定義的程式碼塊(如函式或類)，而上下文管理器可以包裝任意格式的程式碼塊。如果進入上下文管理器就一定會有退出步驟，因此上下文管理器應用最多的地方就是

Python高階程式設計和非同步IO併發程式設計

第13章 asyncio併發程式設計 asyncio 作為 python 未來最有野心也是最有前景的模組，是我們學習 python 高併發程式設計的必學模組。有了12章的基礎，我們直接使用 asyncio 來進行併發程式設計就會變得容易理解，我們從 asyncio 的基本功能開始講解、如何將任務提交到