WowSign/picPreHandle.py at master · shark526/WowSign · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
# -*- coding:utf-8 -*-
# import numpy as np
# import matplotlib.pyplot as plt
# from sklearn.cluster import KMeans
import StringIO
# import sys
from PIL import Image
import PIL.ImageOps
import urllib
import os
import pytesseract
import numpy as np


def saveSampleImg():
	if not os.path.exists('source_img'):
		os.mkdir('source_img')
	for i in xrange(50):
		#save images
		img = Image.open(StringIO.StringIO(urllib.urlopen('http://169ol.com/Stream/Code/getCode').read()))
		imgPath = "source_img/%d.png" %i
		#print imgPath
		img.save(imgPath)

def binarizing(img,threshold): #input: gray image, get black and white images
	pixdata = img.load()
	w, h = img.size
	for y in range(h):
		for x in range(w):
			if pixdata[x, y] < threshold:
				pixdata[x, y] = 0
			else:
				pixdata[x, y] = 255
	return img
def depoint(img,revert=False):   #input: gray image, remove the noise
	pixdata = img.load()
	w,h = img.size
	if revert==False:
		for y in range(0,h):
			for x in range(0,w):
					#remove the frame
					if(y==0 or y==h-1 or x==0 or x==w-1):
						pixdata[x,y] = 255
					count = 0
					if y-1>=0 and pixdata[x,y-1] > 245:
						count = count + 1
					if y+1 < h and pixdata[x,y+1] > 245:
						count = count + 1
					if x-1>=0 and pixdata[x-1,y] > 245:
						count = count + 1
					if x+1 < w and pixdata[x+1,y] > 245:
						count = count + 1
					if count > 2:
						pixdata[x,y] = 255
	else:
		for y in range(h-1,-1,-1):
			for x in range(w-1,-1,-1):
					count = 0
					if y-1>=0 and pixdata[x,y-1] > 245:
						count = count + 1
					if y+1<h and pixdata[x,y+1] > 245:
						count = count + 1
					if x-1>=0 and pixdata[x-1,y] > 245:
						count = count + 1
					if x+1 <w and pixdata[x+1,y] > 245:
						count = count + 1
					if count > 2:
						pixdata[x,y] = 255

#图片x轴的投影，如果有数据（黑色像素点0）值为1否则为0
def get_projection_x(image,invert=False):
	p_x = [0 for x in xrange(image.size[0])]
	for w in xrange(image.size[1]):
		for h in xrange(image.size[0]):
			if invert:
				if image.getpixel((h,w)) == 255:
					p_x[h] = 1
					continue
			else:
				if image.getpixel((h,w)) == 0:
					p_x[h] = 1
					continue
	return p_x

#获取分割后的x轴坐标点
#返回值为[起始位置, 长度] 的列表
def get_split_seq(projection_x):
	res = []
	for idx in xrange(len(projection_x) - 1):
		p1 = projection_x[idx]
		p2 = projection_x[idx + 1]
		if p1 == 1 and idx == 0:
			res.append([idx, 1])
		elif p1 == 0 and p2 == 0:
			continue
		elif p1 == 1 and p2 == 1:
			res[-1][1] += 1
		elif p1 == 0 and p2 == 1:
			res.append([idx + 1, 1])
		elif p1 == 1 and p2 == 0:
			continue
	return res


def get_img_width(projection_x):
	start_pos = 0
	stop_pos = 0
	pro_len = len(projection_x) - 1
	for idx in xrange(pro_len):
		if projection_x[idx] > 0:
			start_pos = idx
			break
	for idx in xrange(pro_len):
		if projection_x[pro_len - idx] > 0:
			stop_pos = pro_len - idx
			break

	return stop_pos - start_pos


# 旋转卡壳
def rotating_calipers(image):
	# original with
	min_width = 100
	min_angle = 100
	for angle in xrange(-60, 60):
		temp_img = image.rotate(angle, expand=True)
		jection = get_projection_x(temp_img, True)
		cur_width = get_img_width(jection)

		if (cur_width < min_width):
			min_width = cur_width
			min_angle = angle

	return image.rotate(min_angle, expand=True)
#分割后的图片，x轴分割后，同时去掉y轴上线多余的空白
def split_image(image, split_seq=None,save_temp=False):
	#image = PIL.ImageOps.invert(image)#反转颜色
	if split_seq is None:
		split_seq = get_split_seq(get_projection_x(image))
	length = len(split_seq)
	imgs = [[] for i in xrange(length)]
	res = []
	for w in xrange(image.size[1]):
		line = [image.getpixel((h,w)) for h in xrange(image.size[0])]
		for idx in xrange(length):
			pos = split_seq[idx][0]
			llen = split_seq[idx][1]
			l = line[pos:pos+llen]
			imgs[idx].append(l)
	ind = 0
	for idx in xrange(length):
		datas = []
		height = 0
		for data in imgs[idx]:
			flag = False
			for d in data:
				if d == 0:
					flag = True
			if flag == True:
				height += 1
				datas += data
		if height <5: # ignore the small image
			continue
		child_img = Image.new('L',(split_seq[idx][1], height))
		child_img.putdata(datas)
		inverted_img = PIL.ImageOps.invert(child_img)
		adjusted_img = rotating_calipers(inverted_img)
		if save_temp:
			tempNumImg = 'temp/0-%d.png' % ind
			adjusted_img.save(tempNumImg)
		ind = ind +1
		#print tempNumImg
		res.append(adjusted_img)
		# recNum = pytesseract.image_to_string(adjusted_img, config='-psm 6 outputbase digits')
		# print recNum

	return res

#saveSampleImg()
def rec_img(imgPath):
	img = Image.open(imgPath).convert("L")
	binarizing(img,170)
	# img.save('C:\\NotBackedUp\\00.png')
	depoint(img)
	depoint(img,True)
	# img.save('C:\\NotBackedUp\\01.png')
	seperated_img = split_image(img,save_temp=True)
	recdString = ""
	for cur_img in seperated_img:
		recNum = pytesseract.image_to_string(cur_img,config='-psm 10 outputbase digits')
		recdString = recdString + recNum

	print recdString
	#img.save('temp/%s.png' % recdString)
	if len(recdString)==4:
		# img.save('temp/%s.png' % recdString)
		print "success"
	else:
		print "error ..."
		img.save('temp/error_%s.png' % recdString)
	return recdString

def resize(img,w_h):
    img_w, img_h = img.size
    background = Image.new('RGBA', w_h, (255, 255, 255, 255))
    background = background.convert("L")
    bg_w, bg_h = background.size
    offset = ((bg_w - img_w) / 2, (bg_h - img_h) / 2)
    background.paste(img, offset)
    return background

def getfiles(dirs):
	fs = []
	for fr in os.listdir(dirs):
		f = dirs + fr
		if f.rfind(u'.DS_Store')==-1:
			fs.append(f)
	return fs

#passing opend image
def getBinaryPix(im):
	img = np.array(im)
	rows, cols = img.shape
	for i in range(rows):
		for j in range(cols):
			if (img[i, j] < 255):
				img[i, j] = 0
			else:
				img[i, j] = 1
		binpix = np.ravel(img) # img.reshape(1, rows * cols)
	return binpix

def loadSplitedBinaryPixImg(imgPath):
    img = Image.open(imgPath).convert("L")
    binarizing(img, 170)
    depoint(img)
    depoint(img, True)
    imgs = split_image(img)
    rs=[]
    for cimg in imgs:
        cimg = PIL.ImageOps.invert(cimg)
        cimg = resize(cimg,(20,25))
        pixs=getBinaryPix(cimg)
        rs.append(pixs)
    return rs

def extractIdentityData():
	dirs = "category/%s/"
	for i in range(10):
		for f in getfiles(dirs % i):
			img = Image.open(f)
			pixs = getBinaryPix(img).tolist()
			pixs.append(i)
			pixs = [str(i) for i in pixs]
			content = ','.join(pixs)
			with open('train_data.txt','a+') as f:
				f.write(content)
				f.write('\n')
				f.close()


if __name__=="__main__":
	# filePath = 'error_675.png'
	# rec_img(filePath)

	#resize images
	# dirs = "category/%s/"
	# for i in range(10):
	# 	for f in getfiles(dirs % (i)):
	# 		img = Image.open(f, 'r')
	# 		inverted_img = PIL.ImageOps.invert(img)
	# 		adjusted_img = rotating_calipers(inverted_img)
	# 		img = PIL.ImageOps.invert(adjusted_img)
	# 		img = resize(img, (20, 25))
	# 		img.save(f)

	extractIdentityData()