-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathPreprocess.py
executable file
·77 lines (53 loc) · 1.6 KB
/
Preprocess.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
#!coding: utf-8
import os, Image, ImageStat
SEUIL = 180
def preprocess_captcha(path, parent):
if not os.path.isfile(path):
print "FICHIER INEXISTANT"
return
im=Image.open(path)
im = im.crop((24, 8, 151, 39)).convert('L')
w = im.size[0]
h = im.size[1]
for i in xrange(w):
for j in xrange(h):
val = im.getpixel((i,j))
if val < SEUIL:
val = 0
else:
val = 255
im.putpixel((i,j), val)
#Si parent=None, on enlève le blanc sur les cotés
minx=100000
maxx=0
for i in xrange(w):
for j in xrange(h):
if im.getpixel((i,j)) == 0:
if i<minx:
minx=i
if i>maxx:
maxx=i
im = im.crop((minx, 0, maxx, 31))
DEST = path[:-4]+".bmp"
im.save(DEST)
return DEST
## Prend en argument le chemin de l'image, et la transforme en une liste à donner à la SVM
## Rescale et centre les données
def load_image_with_mean(path):
im = Image.open(path)
#Puts all values between 0 and 1
im = im.point(lambda e : e/255.)
#Transforms into list
data = list(im.getdata())
#Centers data
stat = ImageStat.Stat(im)
mean = stat.mean[0]
data = map(lambda e : e/mean, data)
return data
def load_image(path):
im = Image.open(path)
#Puts all values between 0 and 1
im = im.point(lambda e : e/255.)
#Transforms into list
data = list(im.getdata())
return data