forked from PatrickLib/captcha_recognize
-
Notifications
You must be signed in to change notification settings - Fork 0
/
captcha_gen_default.py
60 lines (52 loc) · 1.74 KB
/
captcha_gen_default.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import argparse
import random
import os
from captcha.image import ImageCaptcha
import config
IMAGE_HEIGHT = config.IMAGE_HEIGHT
IMAGE_WIDTH = config.IMAGE_WIDTH
CHARS_NUM = config.CHARS_NUM
TEST_SIZE = 1000
TRAIN_SIZE = 50000
VALID_SIZE = 20000
FLAGS = None
def gen(gen_dir, total_size, chars_num):
if not os.path.exists(gen_dir):
os.makedirs(gen_dir)
image = ImageCaptcha(width=IMAGE_WIDTH, height=IMAGE_HEIGHT,font_sizes=[40])
# must be subset of config.CHAR_SETS
char_sets = 'ABCDEFGHIJKLMNPQRSTUVWXYZ'
for i in xrange(total_size):
label = ''.join(random.sample(char_sets, chars_num))
image.write(label, os.path.join(gen_dir, label+'_num'+str(i)+'.png'))
if __name__ == '__main__':
parser = argparse.ArgumentParser()
parser.add_argument(
'--test_dir',
type=str,
default='./data/test_data',
help='Directory testing to generate captcha data files'
)
parser.add_argument(
'--train_dir',
type=str,
default='./data/train_data',
help='Directory training to generate captcha data files'
)
parser.add_argument(
'--valid_dir',
type=str,
default='./data/valid_data',
help='Directory validation to generate captcha data files'
)
FLAGS, unparsed = parser.parse_known_args()
print('>> generate %d captchas in %s' % (TEST_SIZE, FLAGS.test_dir))
gen(FLAGS.test_dir, TEST_SIZE, CHARS_NUM)
print ('>> generate %d captchas in %s' % (TRAIN_SIZE, FLAGS.train_dir))
gen(FLAGS.train_dir, TRAIN_SIZE, CHARS_NUM)
print ('>> generate %d captchas in %s' % (VALID_SIZE, FLAGS.valid_dir))
gen(FLAGS.valid_dir, VALID_SIZE, CHARS_NUM)
print ('>> generate Done!')