forked from sunshineInmoon/Tools
-
Notifications
You must be signed in to change notification settings - Fork 0
/
text_process.py
189 lines (178 loc) · 6.23 KB
/
text_process.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
# -*- coding: utf-8 -*-
"""
Created on Thu Mar 31 11:51:03 2016
@author: Administrator
"""
import cv2
import os
import shutil
import csv as CSV
'''
函数:name_convert()
功能:采集到的图片名字命名时是字符型,将其转换成000000001形式
另外进行比例缩放到128*128,同时转成灰度图
输入的参数:dir_name 只存放图片的文件夹名字
dir_name_save 保存结果文件夹
'''
def name_convert(dir_name,dir_name_save):
num = 0
for dirpath,dirnames,filenames in os.walk(dir_name):
for files in filenames:
image_path = dir_name + '/' + files
img = cv2.imread(image_path)
res = cv2.resize(img,(128,128))
gray = cv2.cvtColor(res,cv2.COLOR_BGR2GRAY)
save_file_path = "%s%s%09d%s"%(dir_name_save,'/',num,'.bmp')
num += 1
if num%1000 == 0:
print u'已经完成 %d 张........'%(num)
cv2.imwrite(save_file_path,gray)
print u'name_covert 完成 共处理 %d 张图片'%(num)
'''
函数:creat_imagelist_NoLabel()
功能:是把一个文件夹下所有图片写进一个imagelist.txt文件中
输入参数:dir_path 存放图片的文件夹
imagelist_path,保存路径
issubdir----是否有子文件 修改于2016年5月19日14:27:14
'''
def creat_imagelist_NoLabel(dir_path,imagelist_path,issubdir='false'):
if issubdir == 'false':
fr = open(imagelist_path,'w')
count = 0
for dirpath,dirnames,filenames in os.walk(dir_path):
for files in filenames:
image_path = dir_path + '/' + files + '\n'
fr.write(image_path)
count += 1
fr.close()
print u'creat_imageslist_NoLabel 完成,共%d张图片'%(count)
else:#修改于2016年5月19日14:28:51
fr = open(imagelist_path,'w')
count = 0
dirs = os.listdir(dir_path)
for sub in dirs:
sub_name = dir_path + '/' + sub
if os.path.isdir(sub_name):
files = os.listdir(sub_name)
for filename in files:
file_path = sub_name + '/' + filename
fr.write(file_path+'\n')
count += 1
else:
fr.write(sub_name+'\n')
count += 1
fr.close()
print u'creat_imageslist_NoLabel 完成,共%d张图片'%(count)
'''
函数:clean_image()
功能:人脸检测后把没有检测到的人脸剔除
输入参数:imagelist---人脸检测后的路劲列表
dir_path_save---保存路径
'''
def clean_image(imagelist,dir_path_save):
if not os.path.exists(dir_path_save):
os.mkdir(dir_path_save)
fr = open(imagelist,'r')
lines = fr.readlines()
num = 0
for line in lines:
sourcefile_path = line.strip('\n')
targefile_path = "%s%s%09d%s"%(dir_path_save,'/',num,'.bmp')
shutil.copyfile(sourcefile_path,targefile_path)
num += 1
if num%1000 == 0:
print u"clean_image %d 张图片"%(num)
print u"已经完成 clean_image 共%d张图片"%(num)
'''
函数:CreatImageListWithLabel()
功能:创建caffe imagelist.txt 文件,此文件带标签
输入参数:dir_path 图片路径,一般为保存很多子文件夹的跟文件夹路径
imgelist 输出文件路径默认是当前文件夹下
'''
def CreatImageListWithLabel(dir_path,imagelist):
fr = open(imagelist,'w')
Label_Num = 0
for parent,dirnames,filenames in os.walk(dir_path):
#print u'共有%d个子文件夹,即共有%d类'%(len(dirnames),len(dirnames))
for label,dirname in enumerate(dirnames):
#print cls
#print dirname
for subparent,subdirnames,subfilenames in os.walk(dir_path + '/' + dirname):
for filename in subfilenames:
#print dirname + '/' + filename
image_path ="%s%s%s%s %d\n"%('/',dirname,'/',filename,label)
fr.write(image_path)
Label_Num = label
print u'共有%d类'%(Label_Num)
fr.close()
'''
函数:TxtToCsv()
函数功能:将.txt文件转换成csv,这个函数只是在特定情况,针对特定类型.txt使用,
并不通用
输入参数:txt----.txt文件
csv----.csv文件
'''
def TxtToCsv(txtfile,csvfile):
fr = open(txtfile,'r')
csvfile = file(csvfile,'wb')
writer = CSV.writer(csvfile)
writer.writerow(['No','Sample','Similar'])
num = 0
for line in fr.readlines():
#print line
curline = line.strip().split(',')
no = num
if curline[1] == u'负样本'.encode('UTF-8'):
sample = 0
else:
sample = 1
sim = curline[2].split(':')[-1]
data=[no,sample,sim]
writer.writerow(data)
num += 1
'''
函数:Find()
函数功能:寻找包含特定文件数的文件夹
输入参数:dirpath----数据集路径
num----文件夹的数量
'''
def Find(dirpath,num=0):
if not os.path.exists(dirpath):
print u'路径不存在!'
dirs = os.listdir(dirpath)
for sub in dirs:
subdir = dirpath + '/' + sub
files = os.listdir(subdir)
if len(files) == num:
print subdir
img = cv2.imread(subdir+'/'+files[0])
cv2.imshow('res',img)
cv2.waitKey()
cv2.destroyWindow('res')
else:
continue
if __name__ == '__main__':
'''
dir_name = 'E:/practical_face/LogPhoto'
dir_name_save = 'E:/practical_face/result/passerbPhoto'
imagelist = 'E:/practical_face/imagelist.txt'
if not os.path.exists(dir_name_save):
os.mkdir(dir_name_save)
'''
'''
name_convert(dir_name,dir_name_save)
'''
'''
imagelist_path = 'E:/practical_face/result/imagelist.txt'
creat_imagelist_NoLabel(dir_name_save,imagelist_path)
'''
'''
clean_image('E:/practical_face/result/clean_imagelist.txt','E:/practical_face/result/clean_image')
'''
#CreatImageListWithLabel(dir_name,imagelist)
'''
txt = r'E:/Face_data/result_my_2.txt'
csv = r'E:/Face_data/result.csv'
TxtToCsv(txt,csv)
'''
Find('E:/Face_data/FaceImages3')