forked from pcyin/NL2code
-
Notifications
You must be signed in to change notification settings - Fork 0
/
project_work.py
56 lines (47 loc) · 1.64 KB
/
project_work.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
# open('/content/NL2code/all.anno')
from nn.utils.generic_utils import init_logging
from nn.utils.io_utils import deserialize_from_file, serialize_to_file
# Start-up markers kept from the original script so its output is unchanged.
print('Hi')
print('Hello')

# Load the serialized dataset. The result is unpacked into three splits; only
# train_data is inspected by the rest of this script.
# NOTE(review): deserialize_from_file presumably unpickles the file -- only
# point it at trusted data; confirm against nn.utils.io_utils.
train_data, dev_data, test_data = deserialize_from_file('/content/NL2code/data/hs.freq3.pre_suf.unary_closure.bin')

# Size summary of the training split.
print('Total Grammar Rules: ' + str(len(train_data.grammar.rules)))
print('Total Annotation Vocabs: ' + str(len(train_data.annot_vocab.token_id_map)))
print('Total Terminal Vocabs: ' + str(len(train_data.terminal_vocab.token_id_map)))
# Report the number of examples. The previous version stringified the whole
# example collection here, flooding the output instead of printing a total.
print('Total examples: ' + str(len(train_data.examples)))
print('-' * 100)
# Preview the grammar: print at most the first 11 rules, then a separator.
# zip() stops as soon as range(11) is exhausted, which caps the preview
# without a manual counter/break.
for _, rule in zip(range(11), train_data.grammar.rules):
    print(rule)
print('-' * 100)
# Preview the annotation vocabulary: print the first 51 entries (indices
# 0-50) yielded by iterating token_id_map, followed by a separator.
# The original ran this exact loop (and separator) twice in a row, printing
# the same entries twice; the copy-pasted duplicate has been removed.
# NOTE(review): iterating token_id_map presumably yields the token keys --
# confirm the mapping type.
for i, annot_token in enumerate(train_data.annot_vocab.token_id_map):
    print(annot_token)
    if i == 50:
        break
print('-' * 100)
# Preview the terminal vocabulary: print at most the first 51 entries yielded
# by iterating token_id_map, then a separator. range(51) bounds the preview
# because zip() ends with its shortest input.
for _, terminal_entry in zip(range(51), train_data.terminal_vocab.token_id_map):
    print(terminal_entry)
print('-' * 100)
# Dump the first two training examples. For each one, print a banner line
# followed by the corresponding attribute, in this fixed order:
# parse_tree, code, query, actions.
for _, sample in zip(range(2), train_data.examples):
    for banner, field in (
        ('####### Parse Tree #########', 'parse_tree'),
        ('####### Code #########', 'code'),
        ('####### Query #########', 'query'),
        ('####### Actions #########', 'actions'),
    ):
        print(banner)
        print(getattr(sample, field))
# print(train_data.examples[0].parse_tree)
# print(train_data.annot_vocab.token_id_map)
# print(train_data.terminal_vocab.token_id_map)
# print(train_data.grammar.rules)
# print(train_data.grammar.node_type_to_id)