Imagenet標註檔案的Read和Write

阿新 • • 發佈：2019-01-06

image_label_util.py

#coding:utf-8
import os, cv2, shutil, random, codecs, HTMLParser
from lxml import etree
from lxml.etree import Element, SubElement, tostring

class PicAnno:
    """Annotation data for one picture: folder, file name, size and objects.

    Attributes:
        folder: Folder name passed to the constructor or ``set_folder``.
        filename: Picture file name; ``None`` until ``set_filename`` is called.
        width, height, depth: Picture size; ``None`` until ``set_size`` is
            called. Values are stored exactly as given (no type conversion).
        objects: List of the objects added through ``add_object``.
    """

    def __init__(self, folder):
        """Create an annotation for a picture stored in *folder*."""
        self.folder = folder
        # Every attribute is created up front so that a freshly built
        # annotation can be read before any setter has been called.
        self.filename = None
        self.width = None
        self.height = None
        self.depth = None
        # Per-instance list: a class-level list would be shared by every
        # annotation that did not rebind it.
        self.objects = []

    def set_folder(self, folder):
        """Replace the folder name."""
        self.folder = folder

    def set_filename(self, filename):
        """Set the picture file name."""
        self.filename = filename

    def set_size(self, width, height, depth):
        """Set the picture width, height and depth."""
        self.width = width
        self.height = height
        self.depth = depth

    def add_object(self, object):
        """Append one annotated object to ``objects``.

        The parameter keeps its original name (which shadows the builtin) so
        that existing keyword callers continue to work.
        """
        self.objects.append(object)


class PicObject:
    """One annotated object: a name, optional flags and a bounding box.

    Attributes:
        name: Object name passed to the constructor or ``set_name``.
        pose, truncated, difficult: ``None`` until the matching setter is
            called. Values are stored exactly as given.
        xmin, ymin, xmax, ymax: Bounding-box coordinates; ``None`` until
            ``set_bndbox`` is called.
    """

    def __init__(self, name):
        """Create an object called *name* with all other fields unset."""
        self.name = name
        # Created up front so the attributes always exist, even when the
        # corresponding setter is never called.
        self.pose = None
        self.truncated = None
        self.difficult = None
        self.xmin = None
        self.ymin = None
        self.xmax = None
        self.ymax = None

    def set_name(self, name):
        """Replace the object name."""
        self.name = name

    def set_pose(self, pose):
        """Set the pose value."""
        self.pose = pose

    def set_truncated(self, truncated):
        """Set the truncated flag."""
        self.truncated = truncated

    def set_difficult(self, difficult):
        """Set the difficult flag."""
        self.difficult = difficult

    def set_bndbox(self, xmin, ymin, xmax, ymax):
        """Set the four bounding-box coordinates."""
        self.xmin = xmin
        self.ymin = ymin
        self.xmax = xmax
        self.ymax = ymax


class VocUtil:
    """Read, build and save annotation XML files and write image-set lists.

    The XML layout handled here is ``annotation`` -> ``folder``, ``filename``,
    ``size`` (``width``/``height``/``depth``) and any number of ``object``
    elements (``name``, ``pose``, ``truncated``, ``difficult``, ``bndbox``).
    """

    @staticmethod
    def _first_text(node, path):
        """Return the text of the first match of *path*, or None if none."""
        matches = node.xpath(path)
        return matches[0].text if matches else None

    @staticmethod
    def _add_text_node(parent, tag, value):
        """Append ``<tag>`` to *parent*; fill its text unless value is None."""
        node = SubElement(parent, tag)
        if value is not None:
            # Text values are passed through untouched (calling str() on
            # non-ASCII unicode fails on Python 2); everything else, such as
            # integer coordinates, is converted with str().
            if isinstance(value, (str, type(u''))):
                node.text = value
            else:
                node.text = str(value)
        return node

    def read_anno_xml(self, xml_path):
        """Parse the annotation file at *xml_path* into a ``PicAnno``.

        All values are kept as the element text (strings); nothing is
        converted to numbers. An element that is absent from the file yields
        ``None`` for the corresponding attribute instead of an error.

        The file is parsed with ``etree.parse``; for a file in a legacy
        encoding such as GBK, decode its text first and use
        ``etree.fromstring`` instead.

        Returns:
            A ``PicAnno`` holding one ``PicObject`` per ``object`` element.
        """
        root = etree.parse(xml_path).getroot()
        text = self._first_text

        picAnno = PicAnno(text(root, '/annotation/folder'))
        picAnno.set_filename(text(root, '/annotation/filename'))
        picAnno.set_size(text(root, '/annotation/size/width'),
                         text(root, '/annotation/size/height'),
                         text(root, '/annotation/size/depth'))
        for obj in root.xpath('/annotation/object'):
            picObject = PicObject(text(obj, 'name'))
            picObject.set_pose(text(obj, 'pose'))
            picObject.set_truncated(text(obj, 'truncated'))
            picObject.set_difficult(text(obj, 'difficult'))
            picObject.set_bndbox(text(obj, 'bndbox/xmin'),
                                 text(obj, 'bndbox/ymin'),
                                 text(obj, 'bndbox/xmax'),
                                 text(obj, 'bndbox/ymax'))
            picAnno.add_object(picObject)
        return picAnno

    def parse_anno_xml(self, picAnno):
        """Serialize *picAnno* to pretty-printed annotation XML text.

        Every element is always emitted; an attribute that is missing or
        ``None`` produces an empty element.

        Returns:
            The XML document as unicode text, without an XML declaration.
        """
        add = self._add_text_node
        node_root = Element('annotation')
        add(node_root, 'folder', getattr(picAnno, 'folder', None))
        add(node_root, 'filename', getattr(picAnno, 'filename', None))

        node_size = SubElement(node_root, 'size')
        for tag in ('width', 'height', 'depth'):
            # getattr with a default also covers an annotation on which
            # set_size was never called.
            add(node_size, tag, getattr(picAnno, tag, None))

        for obj in picAnno.objects:
            node_object = SubElement(node_root, 'object')
            for tag in ('name', 'pose', 'truncated', 'difficult'):
                add(node_object, tag, getattr(obj, tag, None))
            node_bndbox = SubElement(node_object, 'bndbox')
            for tag in ('xmin', 'ymin', 'xmax', 'ymax'):
                add(node_bndbox, tag, getattr(obj, tag, None))

        # Serializing straight to unicode keeps non-ASCII characters readable
        # while leaving '&', '<' and '>' escaped. Un-escaping the finished
        # document afterwards would turn those back into raw markup and make
        # the XML malformed.
        return tostring(node_root, pretty_print=True, encoding='unicode')

    def save_anno_xml(self, xml_path, xml_text):
        """Write *xml_text* to *xml_path* encoded as UTF-8."""
        if isinstance(xml_text, bytes):
            # The codecs writer expects text; byte strings are taken to be
            # UTF-8 already.
            xml_text = xml_text.decode('utf-8')
        with codecs.open(xml_path, 'w', 'utf-8') as f:
            f.write(xml_text)

    def readFile(self, path):
        """Return the lines of the file at *path*, each stripped of
        surrounding whitespace."""
        with open(path, 'r') as handle:
            return [line.strip() for line in handle]

    def writeLines(self, file_path, lines):
        """Write *lines* to *file_path*, one stripped line per row.

        The parent directory is created when it does not exist yet.
        """
        file_dir = os.path.dirname(file_path)
        # dirname is '' for a bare file name; os.makedirs('') would raise.
        if file_dir and not os.path.exists(file_dir):
            os.makedirs(file_dir)
        with open(file_path, 'w') as handle:
            handle.writelines(line.strip() + '\n' for line in lines)

    def gene_train_test_val_txt(self, anno_dir, txt_dir):
        """Write test/train/trainval/val list files into *txt_dir*.

        The names are the ``.xml`` file names found in *anno_dir* with the
        extension removed. NOTE: every list receives the complete set of
        names, reshuffled before each write; the names are not partitioned
        between the lists.
        """
        # splitext removes only the final extension, so a dotted name such as
        # 'img.v2.xml' becomes 'img.v2' rather than 'img'.
        pic_names = [os.path.splitext(pic_name)[0]
                     for pic_name in os.listdir(anno_dir)
                     if pic_name.endswith('.xml')]
        for list_name in ('test.txt', 'train.txt', 'trainval.txt', 'val.txt'):
            random.shuffle(pic_names)
            self.writeLines(os.path.join(txt_dir, list_name), pic_names)
        print('生成測試集、訓練集、訓練驗證集、驗證集完成！')

Imagenet標註檔案的Read和Write

image_label_util.py #coding:utf-8 import os, cv2, shutil, random, codecs, HTMLParser from lxml import etree from lxml.etree import

Linux下的C語言程式設計——系統呼叫read和write函式實現檔案拷貝

系統呼叫read和write函式實現檔案拷貝 #include <stdio.h> #include <sys/types.h> #include <sys/st

read 和write

exceptio ner row obia code stat java lose ted read： import java.io.FileReader; //導入包import java.io.IOException; //導入

read和write函數

次循環 ring 讀取時間片超時時間 jsb 排序結合通過 1、write() 函數定義：ssize_t write (int fd, const void * buf, size_t count); 函數說明：write()會把參數buf所指的內存寫入cou

C語言read和write函式解析

在研究一份AES加密程式碼的時候，發現程式碼從command line獲取資料僅僅使用了read函式，很是疑問。從command line獲取資料不是要使用scanf函式嗎？所以，詳細瞭解了C庫的read函式特性。順帶了write函式，他們是couple一對兒!!! 主要參考文章：h

組合語言呼叫Linux系統呼叫read和write

.section .data UserMsg: .ascii "Please input the message:" LenOfUserMsg: .equ lenMsg, LenOfUserMsg - UserMsg #.section .bss # .lcomm r

linux中的read和write系統呼叫

linux中read和write系統呼叫在這裡小koala著重於read()和write()來讀寫普通檔案，因為小koala在編寫實際檔案讀寫函式時，疏忽了一些重要的地方，造成無休止的向系統中寫資料，最後系統崩潰。當時瞬間“三觀”盡毀。現在較為詳細地分析錯誤

Python中read和write用法

1、讀操作讀操作有read、readline和readlines函式看示例： f = open('1.txt','r') data = f.read() #讀出所有的內容 print data f.close()結果： >>> I'm

字元裝置之read和write

1.核心空間的read()和write(): read和write最大的意義是完成使用者空間到核心空間的資料互動.其原型如下: ssize_t read(struct file *filp,char __user *buff,size_t count,lof

用read（）和write（）讀寫二進位制檔案

#include<iostream> #include<fstream> #include<cstring> #include<cstdlib> us

Nginx事件處理中的connection和read、write事件的關聯

ase handle inux cycle ngx auth eof conn ont /********************************************************************* * Author : Samson

Unix系統編程（）open，read，write和lseek的綜合練習

har ring strtol 開始 splay 進制 void oct unsigned 需求：程序的第一個命令行參數為將要打開的文件名稱，余下的參數則指定了文件上執行的輸入輸出操作。每個表示操作的參數都以一個字母開頭，緊跟以相關值（中間無空格分隔）。 soffet：

c/c++ 學習-read 函式和 write 函式

read 函式和 write 函式最近開始從事搜尋引擎的工作,所以又重新開始了c/c++的旅程,時隔4年不得不復習一下c/c++其中的內容,以下內容有網上別的朋友發表的,也有我自己總結的.1. read #include ssize_t re

【Linux】使用read、write、lseek函式實現檔案讀寫操作

本文章主要講述Linux環境下檔案的讀寫操作，使用到的函式有open、read、write、lseek。 open:用於開啟或者建立檔案。 read:從檔案中讀指定位元組的資料到記憶體中。 write：將記憶體中資料寫入到檔案中。 lseek：可以改變當前檔案偏移量。 #

檔案操作程式設計一（open、close、read、write、lseek函式的使用）

一、open()函式用於開啟或建立檔案，在開啟或建立檔案時可以指定檔案的屬性及使用者的許可權等各種引數所需標頭檔案：#include <sys/types.h> /* 提供型別pid_t 的定義 */ #include <sys/stat.h> #

Spark WordCount 讀寫hdfs檔案 (read file from hadoop hdfs and write output to hdfs)

create a scala project and a WordCount class as follow: package com.qiurc.test import org.apache.spark._ import SparkContext._ o

系統呼叫——open、write、read和close

一、檔案描述符每一個程序都有一個與之相關的檔案描述符，它們是一些小值整數，我們可以通過這些檔案描述符來訪問開啟的檔案。一般地，一個程式開始執行時，會自動開啟3個檔案描述符： 0——–標準輸入———-stdin 1——–標準輸出———-stdout

Android JNI層實現檔案的read、write與seek操作

轉自：http://blog.csdn.net/conowen/article/details/7525837 /*******************************************************************************

十五、1檔案的相關操作：開啟檔案的方法、關閉檔案、【write（）、read（）】、檔案備份的流程小例子、readlines、readline

一、開啟方式在python，使用open函式，可以開啟一個已經存在的檔案，或者建立一個新檔案。 open(檔名，訪問模式) ——以只讀的方式開啟test.txt檔案在面向物件oop語言中把【函式名（）】這種形式我們叫做【方法】。（1）文字檔

檔案 I/O操作open、lseek、read、write、close詳解

一，檔案描述符、套接字和管道對於核心而言，所有開啟的檔案都通過檔案描述符引用。檔案描述符是一個非負整數。核心為每個程序維護一個結構體struct task_struct，可稱為程序控制塊（PCB: Process Control Bloc

Imagenet標註檔案的Read和Write

相關推薦