800 20681 , 38 .. ? ? , 20681 ? 800 ?
61722 3 20681 - 3 , . 3 ?
, , , . Python repr() - .
Windows? , open(filename, 'rb').
, , delimiter=" " (, , ). delimiter="\t".
, :
DEBUG = True
f = open('v2-host_tfdf_en.txt', 'rb')
if DEBUG:
rawdata = f.read(200)
f.seek(0)
print 'rawdata', repr(rawdata)
tfdf_Reader = csv.reader(f,delimiter=' ')
c = 0
for row in tfdf_Reader:
c = c + 1
if DEBUG and c <= 10:
print "row", c, repr(row)
print "rowcount", c
: Error: field larger than field limit (131072), , 128 .
, :
(a) - ; TEXT. , , , .
(b) (, ), , . , ( Notepad ++, View/Show Symbol/Show all characters). , csv, - :
# Plain-text alternative that bypasses the csv module: split every line on
# runs of whitespace. The context manager closes the file once all lines
# have been read.
with open('v2-host_tfdf_en.txt', 'r') as f:  # NOT 'rb'
    rows = [line.split() for line in f]