-
Notifications
You must be signed in to change notification settings - Fork 0
/
clumpfinding.py
86 lines (69 loc) · 26.3 KB
/
clumpfinding.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
__author__ = 'ssen'
import computingfrequencies
# Base-4 digit -> nucleotide letter. Built once at import time instead of
# being rebuilt on every call.
_NUMBER_TO_SYMBOL = {0: 'A', 1: 'C', 2: 'G', 3: 'T'}


def numberToSymbol(i):
    """Return the nucleotide letter for the base-4 digit i.

    The mapping is 0 -> 'A', 1 -> 'C', 2 -> 'G', 3 -> 'T'.

    Args:
        i: the digit to translate.

    Returns:
        The matching one-character string, or None when i is not one of
        0, 1, 2, 3 (no exception is raised for unknown digits).
    """
    return _NUMBER_TO_SYMBOL.get(i)
def numberToPattern(i, k):
    """Decode the integer i into the k-letter DNA string it encodes.

    The string is read as a base-4 number, most significant letter first,
    with the digits A=0, C=1, G=2, T=3. For example
    numberToPattern(45, 4) == 'AGTC' because 45 = 0*64 + 2*16 + 3*4 + 1.

    Args:
        i: integer index of the pattern, 0 <= i < 4**k.
        k: length of the pattern to produce, k >= 1.

    Returns:
        The pattern as a string of exactly k characters from 'ACGT'.

    Raises:
        ValueError: if k is smaller than 1 or i lies outside 0 .. 4**k - 1.
            (The recursive formulation never terminated for k < 1 and
            failed with an unrelated TypeError for most out-of-range i.)
    """
    if k < 1:
        raise ValueError('k must be at least 1, got %r' % (k,))
    if not 0 <= i < 4 ** k:
        raise ValueError('i must be in range 0..4**k-1, got %r' % (i,))

    alphabet = 'ACGT'
    letters = []
    remaining = i
    # Peel off base-4 digits from the least significant end; the letters are
    # therefore collected back to front and reversed before joining.
    for _ in range(k):
        remaining, digit = divmod(remaining, 4)
        letters.append(alphabet[digit])
    letters.reverse()
    return ''.join(letters)
def clumpfinding(genome, k, t, L):
    """Find the k-mers that occur at least t times inside some window of length L.

    Straightforward version: every window of L consecutive characters of
    genome is handed to computingfrequencies.computing_frequencies() and
    counted from scratch, so the counting work is repeated for each window.

    Args:
        genome: the sequence text to scan.
        k: length of the patterns to look for.
        t: minimum number of occurrences required within one window.
        L: window length.

    Returns:
        A list of pattern strings, ordered by increasing numeric index.
        The list is empty when genome is shorter than L, because no window
        exists then.
    """
    num_patterns = 4 ** k
    # clump[index] becomes 1 once the pattern with that index reaches the
    # threshold in at least one window.
    clump = [0] * num_patterns

    for start in range(len(genome) - L + 1):
        window = genome[start:start + L]
        # freqArray is indexed by pattern number below, so it is assumed to
        # hold one count per possible k-mer -- TODO confirm against
        # computingfrequencies.computing_frequencies.
        freqArray = computingfrequencies.computing_frequencies(window, k)
        for index in range(num_patterns):
            if freqArray[index] >= t:
                clump[index] = 1

    return [numberToPattern(index, k)
            for index in range(num_patterns)
            if clump[index] == 1]
def betterclumpfinding(genome, k, t, L):
    """Find the k-mers that occur at least t times inside some window of length L.

    Sliding-window version of clumpfinding(): the frequency array is
    computed once for the first window and then updated in place as the
    window moves one position to the right, by removing the k-mer that
    leaves on the left and adding the k-mer that enters on the right.

    Args:
        genome: the sequence text to scan.
        k: length of the patterns to look for.
        t: minimum number of occurrences required within one window.
        L: window length.

    Returns:
        A list of pattern strings, ordered by increasing numeric index.
        The list is empty when genome is shorter than L.
    """
    # Without a full window of length L there is nothing to report. This
    # matches clumpfinding(), whose window loop does not run in that case.
    if len(genome) < L:
        return []

    num_patterns = 4 ** k
    # clump[index] becomes 1 once the pattern with that index reaches the
    # threshold in at least one window.
    clump = [0] * num_patterns

    # Counts for the first window; every later window reuses this array.
    freqArray = computingfrequencies.computing_frequencies(genome[0:L], k)
    for index in range(num_patterns):
        if freqArray[index] >= t:
            clump[index] = 1

    # A window shorter than k cannot contain a k-mer, so there is nothing to
    # slide. Skipping the loop also avoids the negative or over-long slice
    # bounds that L < k would otherwise produce.
    if L >= k:
        for i in range(1, len(genome) - L + 1):
            # k-mer that started the previous window and has now dropped out.
            # patternToNumber is assumed to use the same numbering as
            # numberToPattern -- TODO confirm in computingfrequencies.
            leaving = computingfrequencies.patternToNumber(genome[i - 1:i - 1 + k])
            freqArray[leaving] -= 1

            # k-mer that ends the current window and has just come in.
            entering = computingfrequencies.patternToNumber(genome[i + L - k:i + L])
            freqArray[entering] += 1

            # Only the incremented count can newly reach the threshold.
            if freqArray[entering] >= t:
                clump[entering] = 1

    return [numberToPattern(index, k)
            for index in range(num_patterns)
            if clump[index] == 1]
# Script section. These statements sit at module level, so they run whenever
# this file is executed or imported.
# Earlier manual checks, left disabled:
#print (numberToPattern(45,4))
#print (betterclumpfinding('CGGACTCGACAGATGTGAAGAACGACAATGTGAAGACTCGACACGACAGAGTGAAGAGAAGAGGAAACATTGTAA', 5,4,50))
#f=open('C:/E-coli.txt')
# Read the whole dataset file as the genome. The context manager closes the
# file handle once the text has been read.
# NOTE(review): the text is used exactly as read, so a trailing newline or
# any extra line in the file becomes part of the genome -- confirm the file
# contains only the sequence.
with open('C:/dataset_4_5.txt') as f:
    s=f.read()
# Parameters for this dataset, presumably listed as k L t: 9 484 19
print (betterclumpfinding(s,9,19,484))
# Presumably the expected output of the disabled sample call above: CGACA GAAGA
#print (computingfrequencies.patternToNumber('AGT'))
#a=['AAAAAAAAG', 'AAAAAAAGC', 'AAAAAAGCC', 'AAAAACCCG', 'AAAAAGCAG', 'AAAAAGCCC', 'AAAAAGCCG', 'AAAAATGAT', 'AAAAATTGA', 'AAAACCCGC', 'AAAAGCCCG', 'AAAAGCGGC', 'AAAAGTTGC', 'AAAATATTT', 'AAAATCGCA', 'AAACCCGCC', 'AAACGCCTT', 'AAACTGACC', 'AAACTGGCA', 'AAAGAAGCT', 'AAAGCAGAA', 'AAAGCCCGT', 'AAAGCCGCC', 'AAAGCGCGC', 'AAAGCGGCA', 'AAAGCGGCT', 'AAAGCGGTT', 'AAAGTGATG', 'AAAGTTGCC', 'AAATAATCT', 'AAATATGGC', 'AAATCCGGC', 'AAATCGCAG', 'AAATGATGA', 'AAATGGCGA', 'AAATGGCGC', 'AAATGGCGG', 'AACAACCGG', 'AACACCTGA', 'AACAGCAAC', 'AACAGCACG', 'AACAGGCTA', 'AACAGGTCG', 'AACCAGCAG', 'AACCCCCAC', 'AACCCGAAG', 'AACCCGCCG', 'AACCGATGC', 'AACCGGTTG', 'AACCGTAGG', 'AACCTCCGA', 'AACGCCTGA', 'AACGCCTTA', 'AACGCGTCT', 'AACGCTCTC', 'AACGGCTGT', 'AACTGACCG', 'AACTGGCTG', 'AACTGTAGG', 'AAGAAAGCG', 'AAGAACAGC', 'AAGAACAGG', 'AAGACGCAC', 'AAGACGCAT', 'AAGACGCGC', 'AAGACGCGT', 'AAGAGATGG', 'AAGATGCGC', 'AAGCAGAAG', 'AAGCCCGTA', 'AAGCCGCCG', 'AAGCCGCTA', 'AAGCCGCTT', 'AAGCGCGCA', 'AAGCGGCAG', 'AAGCGGCTG', 'AAGCGGGTT', 'AAGCGGTTG', 'AAGCGTAGC', 'AAGCGTCGC', 'AAGCTAGCG', 'AAGCTGGAA', 'AAGCTTCTC', 'AAGGAGGGG', 'AAGGATTAC', 'AAGGCACTT', 'AAGGCGGTT', 'AAGGCGTTC', 'AAGGCGTTT', 'AAGGTCGGG', 'AAGGTCGTC', 'AAGTGATGG', 'AAGTGCTCC', 'AAGTTGAAG', 'AAGTTGCCG', 'AATAATCTA', 'AATAGCCTG', 'AATAGCTCA', 'AATATCAGC', 'AATATGGCG', 'AATATTGGT', 'AATCAATGC', 'AATCAATTG', 'AATCCGGCC', 'AATCCTGCA', 'AATCGCAGC', 'AATCTGGCA', 'AATCTGTAG', 'AATGATGAA', 'AATGCCAGC', 'AATGCCTGA', 'AATGGCGCT', 'AATTCCGCC', 'AATTGGTCG', 'AATTTGTAG', 'ACAAAATCG', 'ACAAACGCA', 'ACAACCGAT', 'ACAACCGGT', 'ACAAGGAGG', 'ACAATGCCT', 'ACACCGCTG', 'ACACCTGAA', 'ACACTAACA', 'ACAGCAACA', 'ACAGCGCAA', 'ACAGCGTCG', 'ACAGGCTAA', 'ACAGGTCGA', 'ACAGTCATT', 'ACATCAACG', 'ACATCCAAC', 'ACATCTAAC', 'ACATTATTG', 'ACCAATTCC', 'ACCCACCAA', 'ACCCACCAC', 'ACCCCCACG', 'ACCCCGTAG', 'ACCCGAAGG', 'ACCCGCCGA', 'ACCGATAAG', 'ACCGATGCC', 'ACCGCTACT', 'ACCGCTCGG', 'ACCGCTGTG', 'ACCGCTTGG', 'ACCGGTTGC', 'ACCGTAGGC', 'ACCGTGCTG', 'ACCGTTGCC', 'ACCTACGGT', 'ACCTCCCTT', 
'ACCTCCGAC', 'ACCTGAAGC', 'ACCTGTAGG', 'ACCTTGCCA', 'ACGAAAAAA', 'ACGACCCAC', 'ACGACCTTG', 'ACGACGCGG', 'ACGACGTTC', 'ACGACTGCC', 'ACGAGCTCT', 'ACGATATTA', 'ACGCACAGC', 'ACGCATAGC', 'ACGCATTAC', 'ACGCCAGAC', 'ACGCCGCAT', 'ACGCCTGAT', 'ACGCCTTAT', 'ACGCGACTT', 'ACGCGCAAG', 'ACGCGGGGT', 'ACGCGTCGC', 'ACGCGTCTT', 'ACGCGTTAG', 'ACGCTCTCT', 'ACGCTCTTT', 'ACGCTGGCG', 'ACGCTGTCG', 'ACGCTTAAC', 'ACGGAGGGT', 'ACGGATGCA', 'ACGGATGGC', 'ACGGCTGCC', 'ACGGTCTGT', 'ACGGTGCTA', 'ACGGTTATG', 'ACGTCCGTA', 'ACTAAAGCC', 'ACTAACACC', 'ACTATGGCA', 'ACTCAGCGC', 'ACTCGCTTC', 'ACTCTATCC', 'ACTGAACTG', 'ACTGACCGA', 'ACTGCCGGA', 'ACTGCGTTC', 'ACTGGAGTT', 'ACTGGCTGT', 'ACTGTAGGC', 'ACTGTAGGT', 'ACTTATCAG', 'ACTTGAACC', 'ACTTGTGCC', 'ACTTTCGTA', 'ACTTTTAAT', 'AGAAAAAGC', 'AGAAAGCGG', 'AGAACAGGT', 'AGAAGAACA', 'AGAATATTT', 'AGAATCTGT', 'AGACAGCGC', 'AGACGCACA', 'AGACGCATA', 'AGACGCATT', 'AGACGCGCA', 'AGACGCGTT', 'AGAGATGGT', 'AGAGCACCT', 'AGAGCACGA', 'AGAGCAGTT', 'AGATGCGCA', 'AGATGGGAG', 'AGATGGTGC', 'AGCAACAGG', 'AGCACCTCC', 'AGCACGACC', 'AGCAGAAGC', 'AGCAGCCGC', 'AGCAGCCTG', 'AGCAGTTGA', 'AGCCCGCTC', 'AGCCCGTAC', 'AGCCGAGTA', 'AGCCGCAAC', 'AGCCGCCGT', 'AGCCGCTAT', 'AGCCGCTTT', 'AGCCGGTTG', 'AGCCTGATT', 'AGCCTGGTA', 'AGCGCAATA', 'AGCGCACCA', 'AGCGCATCA', 'AGCGCCTTA', 'AGCGCGCAA', 'AGCGCGTCT', 'AGCGCTGCG', 'AGCGGCTGC', 'AGCGGGTTT', 'AGCGGTTGA', 'AGCGTAGCG', 'AGCGTCGCA', 'AGCGTGATT', 'AGCTACGGA', 'AGCTAGCGC', 'AGCTCAGCT', 'AGCTCAGTT', 'AGCTCCGGC', 'AGCTCGTCG', 'AGCTCTTCT', 'AGCTGAGCT', 'AGCTGCAGC', 'AGCTGGAAC', 'AGCTGGATG', 'AGCTGGGAG', 'AGCTTCTCA', 'AGGAGGGGG', 'AGGAGTTAA', 'AGGATTACT', 'AGGATTCGA', 'AGGCAACGG', 'AGGCACTTG', 'AGGCAGTCG', 'AGGCATCTG', 'AGGCATTTG', 'AGGCCGGAT', 'AGGCCTACA', 'AGGCCTACG', 'AGGCCTGAT', 'AGGCGGTTA', 'AGGCGTTCA', 'AGGCGTTTA', 'AGGCTAATG', 'AGGGGGGGA', 'AGGGGGGGG', 'AGGGGGTCG', 'AGGGTGCGG', 'AGGTCGATC', 'AGGTCGGAT', 'AGGTCGGGG', 'AGGTCGTCG', 'AGGTGAAAC', 'AGGTGGGTC', 'AGGTTCGAA', 'AGGTTTTCC', 'AGTACTCTA', 'AGTCATCCT', 'AGTCATTCA', 'AGTCGGCAC', 'AGTCTCGTT', 
'AGTGATGGT', 'AGTGCTCCA', 'AGTTAAATA', 'AGTTCGAGT', 'AGTTGACTT', 'AGTTGCCGT', 'AGTTGGCGC', 'AGTTGGTAG', 'AGTTGTCGA', 'AGTTTGGCA', 'ATAAAATAT', 'ATAACCCGA', 'ATAAGACGC', 'ATAAGATGC', 'ATAAGCCGC', 'ATAAGCGTA', 'ATAAGGCAC', 'ATAAGGCGG', 'ATAAGGCGT', 'ATAATCTAC', 'ATACAGCGA', 'ATACCCCAA', 'ATACCGCTA', 'ATAGCCTGA', 'ATAGCGTCG', 'ATAGCTCAG', 'ATATCAGCA', 'ATATGGATT', 'ATATGGCGG', 'ATATTAATA', 'ATATTGGTG', 'ATATTTTTT', 'ATCAACGCC', 'ATCAATGCC', 'ATCAATTGG', 'ATCACCCAC', 'ATCAGCACC', 'ATCAGCAGC', 'ATCAGGCAA', 'ATCAGGCAG', 'ATCAGGCAT', 'ATCAGGCCT', 'ATCAGGCGT', 'ATCATGCCT', 'ATCCAGCGT', 'ATCCAGCTG', 'ATCCCCCCG', 'ATCCCCGCT', 'ATCCCGTCA', 'ATCCGACAA', 'ATCCGACAT', 'ATCCGACCT', 'ATCCGCCCT', 'ATCCGCGCA', 'ATCCGGCAA', 'ATCCGGCAG', 'ATCCGGCCC', 'ATCCGGCCT', 'ATCCGGGAG', 'ATCCTGCAC', 'ATCCTTCCC', 'ATCGCAGCG', 'ATCGCATCC', 'ATCGGCATC', 'ATCGGGAAA', 'ATCGTTTGA', 'ATCTAACGC', 'ATCTATTCA', 'ATCTGCGCA', 'ATCTGTAGG', 'ATCTTCTTC', 'ATCTTTCTG', 'ATGAAATGA', 'ATGAAATTT', 'ATGAAGCAA', 'ATGATGAAA', 'ATGCATCGG', 'ATGCCGCAT', 'ATGCCTACA', 'ATGCCTGAT', 'ATGCGACGC', 'ATGCGCAAG', 'ATGCGCCGC', 'ATGCGCTTT', 'ATGCGGCGC', 'ATGCGGCGT', 'ATGGCACTA', 'ATGGCGGTG', 'ATGGTGCAT', 'ATGGTGGTG', 'ATTACGCGT', 'ATTACTCAG', 'ATTAGCTCA', 'ATTATTGCG', 'ATTCATCTT', 'ATTCCGCCA', 'ATTCGAACC', 'ATTCTGGTG', 'ATTGACTCG', 'ATTGCGGAT', 'ATTGCGGCA', 'ATTGGTCGC', 'ATTTAGCGT', 'ATTTGTAGG', 'ATTTTGTAG', 'CAAAAGTTG', 'CAAAATCGC', 'CAAAGCCGC', 'CAAAGCGCG', 'CAAATCAAC', 'CAAATCCGG', 'CAACAACCG', 'CAACAGGCT', 'CAACCGATG', 'CAACCGGTT', 'CAACGCCTG', 'CAACGCTCT', 'CAACGGCTG', 'CAACGGTGG', 'CAACTGGCT', 'CAAGCGTCG', 'CAAGCTGGA', 'CAAGGAGGG', 'CAAGGTCGG', 'CAATAGCCT', 'CAATATCAG', 'CAATATTGG', 'CAATCAATG', 'CAATGCCTG', 'CAATTCCGC', 'CAATTGGTC', 'CACAATGCC', 'CACAGCGTC', 'CACCAGCGC', 'CACCCACCA', 'CACCCCGTA', 'CACCGCTGT', 'CACCGTTGC', 'CACCTCCCT', 'CACCTGAAG', 'CACCTTCGC', 'CACGACCCA', 'CACGACCTT', 'CACGACGTT', 'CACGACTGC', 'CACGCCGCA', 'CACGCTGCC', 'CACGGTCTG', 'CACGTCCGT', 'CACTAACAC', 'CACTATGGC', 'CACTGAACT', 'CACTGCGTT', 
'CACTGGAGT', 'CACTGTAGG', 'CACTTGTGC', 'CAGAAAAAG', 'CAGAAGAAC', 'CAGAAGCAG', 'CAGAATATT', 'CAGACAGCG', 'CAGCAACAG', 'CAGCACGCC', 'CAGCAGCAA', 'CAGCAGCCG', 'CAGCAGGCC', 'CAGCCACAA', 'CAGCCCGCT', 'CAGCCGCAA', 'CAGCCTGGT', 'CAGCGCAAT', 'CAGCGCACC', 'CAGCGCTGC', 'CAGCGTCGC', 'CAGCTCCGG', 'CAGCTGAGC', 'CAGCTGGGA', 'CAGGAGTTA', 'CAGGCAACG', 'CAGGCAGTC', 'CAGGCATCT', 'CAGGCATTT', 'CAGGCCTAC', 'CAGGCTAAT', 'CAGGTCGAT', 'CAGGTGAAA', 'CAGGTTCGA', 'CAGTCATTC', 'CAGTCGGCA', 'CAGTTCCAG', 'CAGTTGACT', 'CAGTTGGCG', 'CAGTTGGTA', 'CAGTTGTCG', 'CATAACCCG', 'CATAGCGTC', 'CATCAACGC', 'CATCACCCA', 'CATCAGGCA', 'CATCAGGCG', 'CATCATCAT', 'CATCCAACG', 'CATCCCCCC', 'CATCCGACA', 'CATCCGGCA', 'CATCCGGGA', 'CATCCTGCA', 'CATCCTTCC', 'CATCGGGAA', 'CATCTAACG', 'CATCTGCGC', 'CATCTTTCT', 'CATGCCGAC', 'CATGCCTAC', 'CATTACGCG', 'CATTATTGC', 'CATTCATCT', 'CATTCTGAT', 'CCAAAGCGC', 'CCAACTGGC', 'CCAAGGTCG', 'CCAATTCCG', 'CCACCAGCA', 'CCACCCCGT', 'CCACCTCTT', 'CCACCTTCG', 'CCACGTCCG', 'CCAGAAGAA', 'CCAGACAGC', 'CCAGCAGCA', 'CCAGCAGGC', 'CCAGCTCTT', 'CCAGCTGAG', 'CCAGTTCCA', 'CCAGTTGTC', 'CCCACCAAT', 'CCCACCACT', 'CCCACGTCC', 'CCCCACGTC', 'CCCCCACGT', 'CCCCCCGGT', 'CCCCCGCAA', 'CCCCCGGTG', 'CCCCGCAAC', 'CCCCGCTGG', 'CCCCGGTCG', 'CCCCGGTGT', 'CCCCGTAGG', 'CCCCTCCAA', 'CCCGAAGGT', 'CCCGCAACC', 'CCCGCCGAA', 'CCCGCTCAC', 'CCCGCTCCA', 'CCCGCTGGC', 'CCCGGACGG', 'CCCGGTCGG', 'CCCGGTGTG', 'CCCGGTTTA', 'CCCGTACTT', 'CCCGTAGGT', 'CCCGTCATC', 'CCCTACATG', 'CCCTCCAAA', 'CCCTGCGGG', 'CCCTTACAA', 'CCCTTCGGG', 'CCGAACCGT', 'CCGAAGCGG', 'CCGAAGGTC', 'CCGACAACC', 'CCGACATCA', 'CCGACATCC', 'CCGACATTA', 'CCGACCGCT', 'CCGACCTAC', 'CCGACCTGT', 'CCGAGCCGG', 'CCGAGTACT', 'CCGATAAGC', 'CCGATGCCT', 'CCGCAACAA', 'CCGCAACCA', 'CCGCAGGCG', 'CCGCATCCG', 'CCGCCACCT', 'CCGCCCTAC', 'CCGCCGAAG', 'CCGCCGTCG', 'CCGCGCAAA', 'CCGCTACTA', 'CCGCTATTG', 'CCGCTCACT', 'CCGCTCCAA', 'CCGCTCGGT', 'CCGCTGACG', 'CCGCTGGCG', 'CCGCTGTGA', 'CCGCTGTTC', 'CCGCTTGGC', 'CCGCTTTCT', 'CCGGACGGT', 'CCGGATAAG', 'CCGGATGCG', 'CCGGCAATC', 'CCGGCAGTT', 
'CCGGCCCCC', 'CCGGCCTAC', 'CCGGGAGGA', 'CCGGTCGGG', 'CCGGTGCCT', 'CCGGTGTGT', 'CCGGTTGCC', 'CCGGTTGCG', 'CCGGTTTAT', 'CCGTACTTT', 'CCGTAGGCC', 'CCGTAGGTC', 'CCGTCATCA', 'CCGTCGAAG', 'CCGTTGCCG', 'CCTACAAAA', 'CCTACAACT', 'CCTACACCG', 'CCTACATGT', 'CCTACGCCA', 'CCTACGGAG', 'CCTACGGAT', 'CCTACGGGG', 'CCTACGGTT', 'CCTCCAAAA', 'CCTCCCTTA', 'CCTCCGACC', 'CCTGAAGCT', 'CCTGATAAG', 'CCTGATGCG', 'CCTGATTTA', 'CCTGCACGA', 'CCTGCGGCA', 'CCTGCGGGC', 'CCTGGCGCT', 'CCTGGTAGC', 'CCTGTAGGC', 'CCTTACAAG', 'CCTTACCGC', 'CCTTATCCG', 'CCTTCCCCG', 'CCTTCGGGT', 'CCTTGCCAA', 'CGAAAAAAA', 'CGAACCGTA', 'CGAACCTCC', 'CGAAGCCGC', 'CGAAGCGGG', 'CGAAGCTTC', 'CGAAGGTCG', 'CGAAGTTGA', 'CGAATCCTG', 'CGACAACCG', 'CGACATCAA', 'CGACATCCA', 'CGACATTAT', 'CGACCCACC', 'CGACCGCTC', 'CGACCTACG', 'CGACCTGTA', 'CGACCTTGC', 'CGACGCGGC', 'CGACGCTGG', 'CGACGCTGT', 'CGACGCTTA', 'CGACGCTTG', 'CGACTGCCG', 'CGACTTATC', 'CGAGCCGGT', 'CGAGCGCCT', 'CGAGCTCTT', 'CGAGGGGGG', 'CGAGTACTC', 'CGAGTCATC', 'CGAGTCTCG', 'CGAGTTCGA', 'CGATAAGCC', 'CGATACCCC', 'CGATCCCGT', 'CGATCCGCG', 'CGATGCCTG', 'CGCAAAGCC', 'CGCAACAAC', 'CGCAACCAA', 'CGCAAGCGT', 'CGCAAGCTG', 'CGCAATAGC', 'CGCACAATG', 'CGCACAGCG', 'CGCACCAAA', 'CGCACGACT', 'CGCAGGTTC', 'CGCATAGCG', 'CGCATCAGG', 'CGCATCCGA', 'CGCATCCGG', 'CGCATTACG', 'CGCCACCTT', 'CGCCAGACA', 'CGCCAGCAG', 'CGCCAGTTG', 'CGCCCTACA', 'CGCCCTGCG', 'CGCCCTTCG', 'CGCCGAAGC', 'CGCCGCAGC', 'CGCCGCATC', 'CGCCGCGCC', 'CGCCGCTGA', 'CGCCGTCGA', 'CGCCTGATG', 'CGCCTTATC', 'CGCGACTTA', 'CGCGAGCGC', 'CGCGAGTTC', 'CGCGCAAAG', 'CGCGCAAGC', 'CGCGCTTCG', 'CGCGGGGAA', 'CGCGGGGTG', 'CGCGTCGCA', 'CGCGTCTAC', 'CGCGTCTGC', 'CGCGTCTTA', 'CGCGTTAGC', 'CGCTACGGC', 'CGCTACTAA', 'CGCTATTGC', 'CGCTCACTG', 'CGCTCCAAA', 'CGCTCGCCC', 'CGCTCGGCA', 'CGCTCGGTT', 'CGCTCTCTC', 'CGCTGAAAG', 'CGCTGACGC', 'CGCTGATTG', 'CGCTGCGCG', 'CGCTGGCGC', 'CGCTGGTGG', 'CGCTGTAAT', 'CGCTGTCGC', 'CGCTGTGAA', 'CGCTTAACG', 'CGCTTCACC', 'CGCTTCGCC', 'CGCTTCGCT', 'CGCTTGGCG', 'CGCTTTCTT', 'CGCTTTGCT', 'CGCTTTGTT', 'CGGACGGTG', 'CGGAGGGTG', 
'CGGATAAGA', 'CGGATAAGG', 'CGGATACGG', 'CGGATGCAT', 'CGGATGCGC', 'CGGATGCGG', 'CGGATGGCG', 'CGGCAACGC', 'CGGCAATCA', 'CGGCACTGG', 'CGGCAGTTG', 'CGGCCCCCG', 'CGGCCTACA', 'CGGCCTACG', 'CGGCGCGAG', 'CGGCGCTGG', 'CGGCGGCGG', 'CGGCGGTTC', 'CGGCGTAAA', 'CGGCGTGAA', 'CGGCTGCCG', 'CGGGAATAG', 'CGGGAATTT', 'CGGGAGGAT', 'CGGGCAGCC', 'CGGGCTCAT', 'CGGGGAACA', 'CGGGGAACT', 'CGGGGCTTC', 'CGGGGTCGC', 'CGGGGTGGA', 'CGGGTCGTT', 'CGGGTTTTT', 'CGGTCGGGG', 'CGGTCTGTC', 'CGGTGAGGG', 'CGGTGCCTT', 'CGGTGCTAC', 'CGGTGTGTG', 'CGGTTACGC', 'CGGTTATGT', 'CGGTTCAAA', 'CGGTTCGAT', 'CGGTTCGTA', 'CGGTTGCCT', 'CGGTTGCGC', 'CGGTTTATC', 'CGTAAACGC', 'CGTACGAGC', 'CGTACTTTC', 'CGTAGCCGA', 'CGTAGCGCA', 'CGTAGGCCG', 'CGTCATCAC', 'CGTCCGTAA', 'CGTCGAAGC', 'CGTCGCATC', 'CGTCGGGCT', 'CGTCGGTTC', 'CGTCTACCA', 'CGTCTTATC', 'CGTGAACGC', 'CGTGATCGT', 'CGTGATTTT', 'CGTGCTTCT', 'CGTGGACAG', 'CGTTAGCGT', 'CGTTAGCTC', 'CGTTCACGC', 'CGTTCACGG', 'CGTTCTTTA', 'CGTTGCCGG', 'CGTTGCCTG', 'CGTTGCTGC', 'CGTTTATGC', 'CGTTTCCCG', 'CTAACACCT', 'CTAACGCCC', 'CTAATGCGG', 'CTACAAAAT', 'CTACACCGC', 'CTACATGTG', 'CTACCAATT', 'CTACCGCTA', 'CTACGCCAG', 'CTACGGAGG', 'CTACGGATG', 'CTACGGGGT', 'CTACGGTTA', 'CTACTAAAG', 'CTAGCGCGT', 'CTATCCAGC', 'CTATGGCAC', 'CTATTGCCC', 'CTCACTGCG', 'CTCAGCGCT', 'CTCAGCTGG', 'CTCAGTTGG', 'CTCATAACC', 'CTCATCCCC', 'CTCATCCTT', 'CTCCAAAAG', 'CTCCACCCC', 'CTCCCTTAC', 'CTCCGACCG', 'CTCGCCCTG', 'CTCGCTTCG', 'CTCGGTTCG', 'CTCGTCGGG', 'CTCGTTTCC', 'CTCTATCCA', 'CTCTCGCTG', 'CTCTCTCGC', 'CTCTTCTTT', 'CTGAAAGAA', 'CTGAACTGT', 'CTGAAGCTA', 'CTGACCGAT', 'CTGACGCGA', 'CTGAGCTAC', 'CTGATAAGA', 'CTGATAAGC', 'CTGATGCGA', 'CTGATGCGC', 'CTGATTTAG', 'CTGCACGAC', 'CTGCAGCTG', 'CTGCCAGCG', 'CTGCCCCTC', 'CTGCCGGAT', 'CTGCGCACG', 'CTGCGCCTG', 'CTGCGCGCT', 'CTGCGGCAA', 'CTGCGGGCA', 'CTGCGTTCA', 'CTGCTCCCT', 'CTGCTGAAA', 'CTGGAACAG', 'CTGGAGTTT', 'CTGGCAGTC', 'CTGGCAGTT', 'CTGGCGCAG', 'CTGGCGCGG', 'CTGGCGCGT', 'CTGGCGCTG', 'CTGGCGGAT', 'CTGGCGGCA', 'CTGGCGGCG', 'CTGGCTGGC', 'CTGGCTGTC', 'CTGGGAGAG', 'CTGGGGTAC', 
'CTGGTAGCT', 'CTGTAGGCC', 'CTGTAGGTC', 'CTGTCCAAC', 'CTGTCGCCA', 'CTGTCGCGT', 'CTGTGAAGT', 'CTGTTCATA', 'CTTAACGCG', 'CTTACAAGG', 'CTTACCGCT', 'CTTATCAGG', 'CTTATCATG', 'CTTATCCGC', 'CTTATCCGG', 'CTTCCCCGC', 'CTTCGCCCT', 'CTTCGCTCG', 'CTTCGGGTC', 'CTTCTCATC', 'CTTCTTTAA', 'CTTGAACCC', 'CTTGCCAAG', 'CTTGGCGAT', 'CTTGTGCCG', 'CTTTAAATA', 'CTTTCGTAC', 'CTTTCTGCC', 'CTTTCTTTT', 'CTTTGCTTA', 'CTTTTAATC', 'CTTTTGAAA', 'CTTTTGGGT', 'GAAAAAAAA', 'GAAAAAGCC', 'GAAACTGAC', 'GAAAGAAGC', 'GAAAGCCAG', 'GAAAGCGGC', 'GAAAGTGAT', 'GAAATGATG', 'GAACAGCAA', 'GAACCCCCA', 'GAACCGTAG', 'GAACCTCCG', 'GAACGCCTT', 'GAACTGGAA', 'GAACTGTAG', 'GAAGAAAGC', 'GAAGAACAG', 'GAAGAGATC', 'GAAGCCGCT', 'GAAGCGGGT', 'GAAGCTAGC', 'GAAGCTTCT', 'GAAGGATTA', 'GAAGGTCGT', 'GAAGTGCTC', 'GAAGTTGAA', 'GAATAGCTC', 'GAATCCTGC', 'GAATCTGTA', 'GAATGCCGG', 'GAATTTGTA', 'GACAACCGA', 'GACAGCGCA', 'GACAGTCAT', 'GACATCAAC', 'GACATCCAA', 'GACATTATT', 'GACCCACCA', 'GACCGATAA', 'GACCGCTCG', 'GACCTACGG', 'GACCTGTAG', 'GACCTTGCC', 'GACCTTTCG', 'GACGCACAG', 'GACGCATAG', 'GACGCATTA', 'GACGCGACT', 'GACGCGCAA', 'GACGCGGGG', 'GACGCGTTA', 'GACGCTGGC', 'GACGCTGTC', 'GACGCTTAA', 'GACGGTGCT', 'GACTCGCTT', 'GACTGCCGG', 'GACTTATCA', 'GACTTGAAC', 'GACTTTTAA', 'GAGAGCACC', 'GAGATGGGA', 'GAGATGGTG', 'GAGCACCTC', 'GAGCACGAC', 'GAGCAGCCT', 'GAGCAGTTG', 'GAGCCGGTT', 'GAGCGCCTT', 'GAGCTACGG', 'GAGCTCTTC', 'GAGGATTCG', 'GAGGGGGGG', 'GAGGGGGTC', 'GAGGGTGCG', 'GAGTACTCT', 'GAGTCATCC', 'GAGTCTCGT', 'GAGTTAAAT', 'GAGTTCGAG', 'GAGTTTGGC', 'GATAAGACG', 'GATAAGATG', 'GATAAGCCG', 'GATAAGCGT', 'GATAAGGCA', 'GATAAGGCG', 'GATACCCCA', 'GATACCGCT', 'GATACGGGC', 'GATCAGCAC', 'GATCCCGTC', 'GATCCGCGC', 'GATCGGTTC', 'GATGAAATG', 'GATGCATCG', 'GATGCCTGA', 'GATGCGACG', 'GATGCGCAA', 'GATGCGCCG', 'GATGCGCTT', 'GATGCGGCG', 'GATGGTGCA', 'GATGGTGGT', 'GATTACTCA', 'GATTAGCTC', 'GATTCGAAC', 'GATTGACTC', 'GATTGCCGA', 'GATTTAGCG', 'GATTTTGTA', 'GCAAAGCCG', 'GCAACAACC', 'GCAACAGGC', 'GCAACCAAT', 'GCAACGCTC', 'GCAACGGCT', 'GCAAGCGTC', 'GCAAGCTGG', 'GCAATAGCC', 
'GCAATCAAT', 'GCACAATGC', 'GCACAGCGT', 'GCACCGTTG', 'GCACCTCCC', 'GCACGACCC', 'GCACGACCT', 'GCACGACTG', 'GCACTATGG', 'GCACTGAAC', 'GCACTGGAG', 'GCACTTGTG', 'GCAGAAAAA', 'GCAGAAGCA', 'GCAGAATAT', 'GCAGAGAAG', 'GCAGCCACA', 'GCAGCCCGC', 'GCAGCCGCA', 'GCAGCCTGG', 'GCAGCTCCG', 'GCAGGAAGG', 'GCAGGTTCG', 'GCAGTCGGC', 'GCAGTTGAC', 'GCAGTTGGC', 'GCATAGCGT', 'GCATCAGGC', 'GCATCCGAC', 'GCATCCGGC', 'GCATCCGGG', 'GCATCGGGA', 'GCATCTGCG', 'GCATTACGC', 'GCCAAAGCG', 'GCCAAGGTC', 'GCCACCTTC', 'GCCAGACAG', 'GCCAGCAGC', 'GCCAGCAGG', 'GCCAGCCAC', 'GCCAGTTGT', 'GCCCCCGCA', 'GCCCCTCCA', 'GCCCGCTCA', 'GCCCGTACT', 'GCCCTACAT', 'GCCCTGCGG', 'GCCCTTCGG', 'GCCGAACCG', 'GCCGAAGCG', 'GCCGACCAG', 'GCCGACCTG', 'GCCGAGGAT', 'GCCGAGTAC', 'GCCGCAACA', 'GCCGCATCC', 'GCCGCCAGT', 'GCCGCCGCC', 'GCCGCCGTC', 'GCCGCTATT', 'GCCGCTGAC', 'GCCGCTTTC', 'GCCGGATAA', 'GCCGGATGC', 'GCCGGTATC', 'GCCGGTTGC', 'GCCGTCGAA', 'GCCTACAAA', 'GCCTACAAC', 'GCCTACACC', 'GCCTACGCC', 'GCCTACGGA', 'GCCTACGGG', 'GCCTGATAA', 'GCCTGATGC', 'GCCTGATTT', 'GCCTGCGCC', 'GCCTGCGGC', 'GCCTGGTAG', 'GCCTTACCG', 'GCCTTATCC', 'GCGAAAGTG', 'GCGACCAGC', 'GCGACGCTG', 'GCGACGCTT', 'GCGACTTAT', 'GCGAGCGCC', 'GCGAGGGGG', 'GCGAGTTCG', 'GCGATACCC', 'GCGCAAAGC', 'GCGCAAGCG', 'GCGCAATAG', 'GCGCACAAT', 'GCGCACGAC', 'GCGCATCAG', 'GCGCCAGTT', 'GCGCCGCTG', 'GCGCCTTAT', 'GCGCGAGCG', 'GCGCGCTTC', 'GCGCGGGGA', 'GCGCGTCTA', 'GCGCGTCTG', 'GCGCGTCTT', 'GCGCTACGG', 'GCGCTGCGC', 'GCGCTGCTC', 'GCGCTGGAA', 'GCGCTGGCG', 'GCGCTTCGC', 'GCGCTTTGC', 'GCGGACTGA', 'GCGGATGCG', 'GCGGATTCG', 'GCGGCAACG', 'GCGGCACTG', 'GCGGCGCGA', 'GCGGCGGCG', 'GCGGCGTAA', 'GCGGCGTGA', 'GCGGGAATA', 'GCGGGAATT', 'GCGGGCAGC', 'GCGGGGAAC', 'GCGGGGTGG', 'GCGGGTTTT', 'GCGGTGAGG', 'GCGGTTACG', 'GCGGTTCGA', 'GCGGTTTAT', 'GCGTAAACG', 'GCGTAGCGC', 'GCGTCGCAT', 'GCGTCTACC', 'GCGTCTTAT', 'GCGTGAACG', 'GCGTGATTT', 'GCGTTAGCG', 'GCGTTCACG', 'GCGTTTATG', 'GCTAATGCG', 'GCTACCGCT', 'GCTACGGAT', 'GCTACTAAA', 'GCTAGCGCG', 'GCTATAGCC', 'GCTATTGCC', 'GCTCACTGC', 'GCTCAGCTG', 'GCTCAGTTG', 'GCTCATAAC', 
'GCTCCACCC', 'GCTCGCCCT', 'GCTCGGTTC', 'GCTCGTCGG', 'GCTCTCTCG', 'GCTCTTCTT', 'GCTGACGCC', 'GCTGACGCG', 'GCTGAGCTA', 'GCTGATTGC', 'GCTGCAGCT', 'GCTGCCGGA', 'GCTGCGCGC', 'GCTGCTGAA', 'GCTGCTGCT', 'GCTGCTGGC', 'GCTGGAACA', 'GCTGGCAGT', 'GCTGGCGAT', 'GCTGGCGCG', 'GCTGGCTGG', 'GCTGGGAGA', 'GCTGGGGTA', 'GCTGTCGCC', 'GCTGTCGCG', 'GCTGTGAAG', 'GCTTAACGC', 'GCTTATCCG', 'GCTTCGCCC', 'GCTTCGCTC', 'GCTTCTCAT', 'GCTTGGCGA', 'GCTTTCTTT', 'GCTTTGCTT', 'GCTTTGTTG', 'GGAACAGCA', 'GGAAGGATT', 'GGAATAGCT', 'GGAATGCCG', 'GGAATTTGT', 'GGACAGTCA', 'GGACGGTGC', 'GGACTTGAA', 'GGAGAGCAC', 'GGAGCAGCC', 'GGAGGATTC', 'GGAGGGGGT', 'GGAGGGTGC', 'GGAGTTAAA', 'GGAGTTAAG', 'GGAGTTTGG', 'GGATAAGAC', 'GGATAAGAT', 'GGATAAGGC', 'GGATACGGG', 'GGATGCATC', 'GGATGCGCT', 'GGATGCGGC', 'GGATTACTC', 'GGATTCGAA', 'GGATTGACT', 'GGCAACGCT', 'GGCAACGGC', 'GGCAATCAA', 'GGCACCGTT', 'GGCACTATG', 'GGCACTGGA', 'GGCACTTGT', 'GGCAGAATA', 'GGCAGCCCG', 'GGCAGGAAG', 'GGCAGTCGG', 'GGCAGTTGG', 'GGCATCTGC', 'GGCCCCCGC', 'GGCCGGATA', 'GGCCTACAA', 'GGCCTACAC', 'GGCCTACGA', 'GGCCTACGC', 'GGCCTACGG', 'GGCCTGATA', 'GGCGATACC', 'GGCGCACAA', 'GGCGCAGGC', 'GGCGCGAGC', 'GGCGCGGGG', 'GGCGCGTCT', 'GGCGCTGCT', 'GGCGCTGGA', 'GGCGCTGGC', 'GGCGGATGC', 'GGCGGTGAG', 'GGCGGTTAC', 'GGCGGTTCG', 'GGCGTAAAC', 'GGCGTGAAC', 'GGCGTTCAC', 'GGCGTTTAT', 'GGCTAATGC', 'GGCTCATAA', 'GGCTGCCGG', 'GGCTGGCGT', 'GGCTGGGGT', 'GGCTGTCGC', 'GGCTTCTCA', 'GGGAACTCG', 'GGGAACTCT', 'GGGAAGGAT', 'GGGAATAGC', 'GGGAATTTG', 'GGGACTTGA', 'GGGAGAGCA', 'GGGAGGATT', 'GGGATTGAC', 'GGGCAGAAT', 'GGGCAGCCC', 'GGGCTCATA', 'GGGCTTCTC', 'GGGGAACAC', 'GGGGAACTC', 'GGGGAAGGA', 'GGGGACTTG', 'GGGGATTGA', 'GGGGCAAAA', 'GGGGCTTCT', 'GGGGGAAGG', 'GGGGGACTT', 'GGGGGATTG', 'GGGGGGACT', 'GGGGGGATT', 'GGGGGGGAC', 'GGGGGGGAT', 'GGGGGGGGA', 'GGGGGTCGG', 'GGGGTCGCG', 'GGGGTCGGC', 'GGGGTGGAG', 'GGGTCAAAA', 'GGGTCGCGA', 'GGGTCGGCG', 'GGGTCGTTA', 'GGGTCGTTG', 'GGGTGATTA', 'GGGTGCGGG', 'GGGTGGAGC', 'GGGTTTTTA', 'GGTAAAGTG', 'GGTAGAGCA', 'GGTAGCTCG', 'GGTCAAAAG', 'GGTCGATCC', 'GGTCGCAGG', 
'GGTCGCGAG', 'GGTCGGATA', 'GGTCGGCGG', 'GGTCGGGGC', 'GGTCGGGGT', 'GGTCGTCGG', 'GGTCGTTAG', 'GGTCGTTGC', 'GGTCTGTCC', 'GGTGAAACT', 'GGTGAGGGG', 'GGTGATGTT', 'GGTGATTAG', 'GGTGCACTG', 'GGTGCATCC', 'GGTGCCTTA', 'GGTGCGAGG', 'GGTGCGGGA', 'GGTGCTACC', 'GGTGGAGCA', 'GGTGGGGGA', 'GGTGGGTCA', 'GGTGGTGGG', 'GGTGTGTGC', 'GGTTAACAA', 'GGTTACGCC', 'GGTTATGTT', 'GGTTCAAAT', 'GGTTCGAAT', 'GGTTCGATC', 'GGTTCGTAG', 'GGTTGCCTG', 'GGTTGCGCC', 'GGTTTATCC', 'GGTTTTTAC', 'GTAAACGCC', 'GTACGAGCT', 'GTACTCTAT', 'GTACTTTCG', 'GTAGAGCAC', 'GTAGAGCAG', 'GTAGCCGAG', 'GTAGCGCAT', 'GTAGCTCGT', 'GTAGGCCGG', 'GTAGGCCTG', 'GTAGGTCGG', 'GTCAAAAGT', 'GTCACCATT', 'GTCATCACC', 'GTCATCCTG', 'GTCATTCAT', 'GTCCAACTG', 'GTCCGTAAG', 'GTCGAAGCC', 'GTCGAAGCT', 'GTCGATCCG', 'GTCGCAGGT', 'GTCGCATCA', 'GTCGCATCC', 'GTCGCCAGT', 'GTCGCGAGT', 'GTCGCGTCT', 'GTCGGATAA', 'GTCGGATGC', 'GTCGGCACC', 'GTCGGCGGT', 'GTCGGGCTC', 'GTCGGGGCT', 'GTCGGGGTC', 'GTCGGTTCA', 'GTCGTCGGT', 'GTCGTGGAC', 'GTCGTTAGC', 'GTCGTTGCC', 'GTCTACCAA', 'GTCTCGTTT', 'GTCTGCTTC', 'GTCTGTCCA', 'GTCTTATCA', 'GTCTTCAAT', 'GTGAAACTG', 'GTGAACGCC', 'GTGAAGTGC', 'GTGAGGGGG', 'GTGATCGTG', 'GTGATGGTG', 'GTGATTAGC', 'GTGATTTTG', 'GTGCACTGA', 'GTGCATCCG', 'GTGCCGAAC', 'GTGCCGCAT', 'GTGCCTTAC', 'GTGCGAGGG', 'GTGCGGGAA', 'GTGCTCCAC', 'GTGCTTCTT', 'GTGGACAGT', 'GTGGAGCAG', 'GTGGGGGAA', 'GTGGGTCAA', 'GTGGTGGGG', 'GTGTGCAAT', 'GTGTGTGCA', 'GTTAAATAA', 'GTTACGCCG', 'GTTAGCGTC', 'GTTAGCTCA', 'GTTATGTTC', 'GTTCAAATC', 'GTTCACGCC', 'GTTCACGGT', 'GTTCGAATC', 'GTTCGAGTC', 'GTTCGATCC', 'GTTCGCCAC', 'GTTCGTAGC', 'GTTGACGGC', 'GTTGACTTT', 'GTTGCCAGG', 'GTTGCCGGA', 'GTTGCCGTT', 'GTTGCCTGA', 'GTTGCCTGC', 'GTTGGCGCA', 'GTTGGTAGA', 'GTTTATCCC', 'GTTTATGCC', 'GTTTCCCGC', 'GTTTGGCAA', 'GTTTGTAGG', 'GTTTTTACG', 'TAAACGCCT', 'TAAATAATC', 'TAAATATGG', 'TAAATATTG', 'TAACACCTG', 'TAACCCGAA', 'TAACGCGTC', 'TAAGACGCA', 'TAAGACGCG', 'TAAGAGATG', 'TAAGATGCG', 'TAAGCCGCT', 'TAAGCGTAG', 'TAAGGCACT', 'TAAGGCGGT', 'TAAGGCGTT', 'TAATCAATT', 'TAATGCGGA', 'TACAAAATC', 'TACAAGGAG', 
'TACACCGCT', 'TACCAATTC', 'TACCGCTAC', 'TACCGCTTG', 'TACGAGCTC', 'TACGCCAGA', 'TACGCCGCA', 'TACGCGTCG', 'TACGGAGGG', 'TACGGATGC', 'TACGGATGG', 'TACGGGGTG', 'TACGGTTAT', 'TACTAAAGC', 'TACTCAGCG', 'TACTCTATC', 'TACTTTCGT', 'TAGAGCACG', 'TAGAGCAGT', 'TAGCCGAGT', 'TAGCCTGAT', 'TAGCGCATC', 'TAGCGCGTC', 'TAGCGTCGC', 'TAGCGTGAT', 'TAGCTCAGC', 'TAGCTCAGT', 'TAGCTCGTC', 'TAGGCCGGA', 'TAGGCCTGA', 'TAGGGCAGA', 'TAGGTCGGA', 'TATAAAATA', 'TATCAGCAG', 'TATCAGGCC', 'TATCATGCC', 'TATCCAGCG', 'TATCCAGCT', 'TATCCCCGC', 'TATCCGACC', 'TATCCGCCC', 'TATCCGGCC', 'TATGCCGCA', 'TATGGATTA', 'TATGGCACT', 'TATGGCGGT', 'TATGTTCCG', 'TATTGCCCG', 'TATTGCGGC', 'TATTGGTGA', 'TCAAAAGTT', 'TCAAATCCG', 'TCAACGCCT', 'TCAATATTG', 'TCAATGCCT', 'TCAATTGGT', 'TCACCCACC', 'TCACGACGT', 'TCACGCCGC', 'TCACGGTCT', 'TCACTGCGT', 'TCAGCAGCC', 'TCAGCGCCT', 'TCAGCGCTG', 'TCAGCTGGG', 'TCAGGAGTT', 'TCAGGCAAC', 'TCAGGCAGT', 'TCAGGCATC', 'TCAGGCATT', 'TCAGGCCTA', 'TCAGGCGTT', 'TCAGTTGGT', 'TCATAACCC', 'TCATCACCC', 'TCATCCCCC', 'TCATCCGGC', 'TCATCCTGA', 'TCATCCTGC', 'TCATCCTTC', 'TCATCTTTC', 'TCATGCCTA', 'TCATTCATC', 'TCCAACTGG', 'TCCACCCCG', 'TCCAGACGA', 'TCCAGCTGA', 'TCCCCCCGG', 'TCCCCGCTG', 'TCCCGCTCC', 'TCCCGTCAT', 'TCCCTTACA', 'TCCGACAAC', 'TCCGACATC', 'TCCGACATT', 'TCCGACCGC', 'TCCGACCTA', 'TCCGCCACC', 'TCCGCCCTA', 'TCCGCGCAA', 'TCCGGCAAT', 'TCCGGCAGT', 'TCCGGCCCC', 'TCCGGCCTA', 'TCCGGGAGG', 'TCCGGTTAA', 'TCCTGCACG', 'TCCTTCCCC', 'TCGAACCCC', 'TCGAACCTC', 'TCGAACCTT', 'TCGAAGCCG', 'TCGAAGCTT', 'TCGAATCCT', 'TCGAGTCTC', 'TCGATCCCG', 'TCGATCCGC', 'TCGCAGGTT', 'TCGCATCAG', 'TCGCATCCG', 'TCGCCAGTT', 'TCGCCCTGC', 'TCGCCCTTC', 'TCGCGAGTT', 'TCGCGTCTT', 'TCGCTCGCC', 'TCGCTTCGC', 'TCGGAAAGC', 'TCGGATAAG', 'TCGGATGCG', 'TCGGCATCG', 'TCGGCGGTT', 'TCGGGCTCA', 'TCGGGGCTT', 'TCGGGGTCG', 'TCGGGTCGT', 'TCGGTTCAA', 'TCGGTTCGT', 'TCGGTTTAT', 'TCGTACGAG', 'TCGTAGCCG', 'TCGTCGGGC', 'TCGTCGGTT', 'TCGTGGACA', 'TCGTTAGCT', 'TCGTTGCCT', 'TCGTTTCCC', 'TCTAACGCC', 'TCTACCAAT', 'TCTATCCAG', 'TCTCACTCC', 'TCTCATCCC', 'TCTCATCCT', 
'TCTCCGTTC', 'TCTCGTTTC', 'TCTCTCGCT', 'TCTGCCCCT', 'TCTGCGCAC', 'TCTGTAGGC', 'TCTGTCCAA', 'TCTTATCAG', 'TCTTATCAT', 'TCTTCTTTA', 'TCTTTAAAT', 'TCTTTCTGC', 'TCTTTTGGG', 'TGAAACTGA', 'TGAAAGAAG', 'TGAAAGTGA', 'TGAAATGAT', 'TGAACCCCC', 'TGAACGCCT', 'TGAACTGGC', 'TGAACTGTA', 'TGAAGCTAG', 'TGAAGTGCT', 'TGAATCAGC', 'TGACCGATA', 'TGACGCGAC', 'TGACTCGCT', 'TGACTTTTA', 'TGAGCTACG', 'TGAGGGGGG', 'TGATAAAAA', 'TGATAAGAC', 'TGATAAGCG', 'TGATACCGC', 'TGATCCAGT', 'TGATGAAAT', 'TGATGAAGC', 'TGATGCGAC', 'TGATGCGCC', 'TGATGGTGG', 'TGATGTTGC', 'TGATTAGCT', 'TGATTTAGC', 'TGATTTTGT', 'TGCACCTTT', 'TGCACGACC', 'TGCACTGAA', 'TGCAGCTGA', 'TGCATAATC', 'TGCATCCGG', 'TGCATCGGG', 'TGCCAAGGT', 'TGCCCCTCC', 'TGCCGAACC', 'TGCCGACCT', 'TGCCGCATC', 'TGCCGGATG', 'TGCCTGATG', 'TGCCTGCGG', 'TGCCTTACC', 'TGCGACGCT', 'TGCGAGGGG', 'TGCGCACGA', 'TGCGCCGCT', 'TGCGCCTGT', 'TGCGCGCTT', 'TGCGCTTTG', 'TGCGGATTC', 'TGCGGCAAC', 'TGCGGCACT', 'TGCGGCGCG', 'TGCGGCGTA', 'TGCGGCGTG', 'TGCGGGAAT', 'TGCGGGCAG', 'TGCGTATCG', 'TGCGTTCAC', 'TGCTCCACC', 'TGCTCCCTT', 'TGCTGAAAA', 'TGCTGAAAC', 'TGCTTATCC', 'TGCTTCTTC', 'TGGAACAGC', 'TGGACAGTC', 'TGGAGCAGC', 'TGGAGTTTG', 'TGGCAACAG', 'TGGCAATGG', 'TGGCACTAT', 'TGGCGATAC', 'TGGCGCACA', 'TGGCGCGGG', 'TGGCGCGTC', 'TGGCGCTGC', 'TGGCGGATG', 'TGGCGGTGA', 'TGGCTGGGG', 'TGGCTGTCG', 'TGGGAGAGC', 'TGGGCAGAA', 'TGGGGGAAG', 'TGGGTATAG', 'TGGGTCAAA', 'TGGTAGAGC', 'TGGTAGCTC', 'TGGTCGCAG', 'TGGTGCATC', 'TGGTGCGAG', 'TGGTGGGGG', 'TGGTGGTGG', 'TGTAGGCCT', 'TGTAGGTCG', 'TGTCCAACT', 'TGTCGCCAG', 'TGTCGCGTC', 'TGTCGGATG', 'TGTCGTGGA', 'TGTGAAGTG', 'TGTGCAATA', 'TGTGCCGAA', 'TGTGCCGCA', 'TGTGTGCAA', 'TGTTCATAT', 'TTAAATAAT', 'TTAAATATG', 'TTAAATGAT', 'TTAACGCGT', 'TTAATCAAT', 'TTACAAGGA', 'TTACCGCTT', 'TTACGCCGC', 'TTACGCGTC', 'TTACGTAAA', 'TTACTCAGC', 'TTAGCGTCG', 'TTAGCGTGA', 'TTAGCTCAG', 'TTATCAAAA', 'TTATCAGGC', 'TTATCATGC', 'TTATCCCCG', 'TTATCCGCC', 'TTATCCGGC', 'TTATGCCGC', 'TTATGTTCC', 'TTATTGCGG', 'TTCAAATCC', 'TTCAATATT', 'TTCACGACG', 'TTCACGCCG', 'TTCACGGTC', 'TTCATCTTT', 
'TTCCCGCTC', 'TTCCGCCAC', 'TTCCGGGTA', 'TTCGAACCT', 'TTCGAATCC', 'TTCGAGTCT', 'TTCGATCCC', 'TTCGCCCTT', 'TTCGCTCGC', 'TTCGGGTCG', 'TTCGTACGA', 'TTCGTAGCC', 'TTCTCATCC', 'TTCTGCCCC', 'TTCTTTAAA', 'TTCTTTTGG', 'TTGAAAGTG', 'TTGAACCCC', 'TTGAAGTTG', 'TTGACTCGC', 'TTGACTTTT', 'TTGATACCG', 'TTGCCAAGG', 'TTGCCGACC', 'TTGCCGCCG', 'TTGCCGGAT', 'TTGCCGTTA', 'TTGCCTGAT', 'TTGCCTGCG', 'TTGCGGATT', 'TTGCGGCAC', 'TTGCTTATC', 'TTGGCAACA', 'TTGGCGATA', 'TTGGCGCAC', 'TTGGGTATA', 'TTGGTAGAG', 'TTGGTCGCA', 'TTGGTGCGA', 'TTGTAGGCC', 'TTGTAGGTC', 'TTGTGCCGC', 'TTTAAATAT', 'TTTAATCAA', 'TTTACCGCT', 'TTTACGTAA', 'TTTAGCGTG', 'TTTATCCCC', 'TTTATCGCC', 'TTTATGCCG', 'TTTCAATAT', 'TTTCCCGCT', 'TTTCGTACG', 'TTTCTGCCC', 'TTTCTTTTG', 'TTTGAAAGT', 'TTTGCTTAT', 'TTTGGCAAC', 'TTTGGGTAT', 'TTTGTAGGC', 'TTTGTAGGT', 'TTTGTGCTG', 'TTTTAATCA', 'TTTTACGTA', 'TTTTGAAAG', 'TTTTGGGTA', 'TTTTGTAGG', 'TTTTTACGT']
#print(len(a))