2014-01-10 16:21:35 +01:00
|
|
|
#!/usr/bin/env python2
|
|
|
|
|
|
|
|
import gzip
|
|
|
|
import random
|
|
|
|
import sys
|
|
|
|
|
|
|
|
sizeOfA = 10 * 1000
|
|
|
|
sizeOfB = 20
|
|
|
|
|
|
|
|
print sys.argv
|
2014-06-18 18:19:43 +02:00
|
|
|
if len(sys.argv) == 5:
|
|
|
|
sizeOfA = int(sys.argv[3])
|
|
|
|
sizeOfB = int(sys.argv[4])
|
2014-01-10 16:21:35 +01:00
|
|
|
|
|
|
|
# read all words
|
2014-06-18 18:19:43 +02:00
|
|
|
lines = [line.strip() for line in gzip.open(sys.argv[1])]
|
2014-01-10 16:21:35 +01:00
|
|
|
|
|
|
|
# get A lines
|
|
|
|
A = random.sample(lines, sizeOfA + sizeOfB)
|
|
|
|
|
|
|
|
# get B from the first sieOfB element
|
|
|
|
B = A[:sizeOfB]
|
|
|
|
A = A[sizeOfB:]
|
|
|
|
|
2014-06-18 18:19:43 +02:00
|
|
|
SetsFile = open(sys.argv[2], 'w')
|
2014-01-10 16:21:35 +01:00
|
|
|
SetsFile.write('const int lenA = ' + str(sizeOfA) + ';\n')
|
2014-09-24 22:51:53 +02:00
|
|
|
SetsFile.write('const char* const A[' + str(sizeOfA) + '] = {')
|
2014-01-10 16:21:35 +01:00
|
|
|
SetsFile.writelines(",".join('"' + x + '"\n' for x in A))
|
|
|
|
SetsFile.write('};\n')
|
|
|
|
|
|
|
|
SetsFile.write('const int lenB = ' + str(sizeOfB) + ';\n')
|
2014-09-24 22:51:53 +02:00
|
|
|
SetsFile.write('const char* const B[' + str(sizeOfB) + '] = {')
|
2014-01-10 16:21:35 +01:00
|
|
|
SetsFile.writelines(",".join('"' + x + '"\n' for x in B))
|
|
|
|
SetsFile.write('};\n')
|
|
|
|
|
|
|
|
print("sets.h: sizeOfA = " + str(len(A) + len(B)) + " generated...")
|