skip newsgroup header (#5585)

This commit is contained in:
Hiroya Chiba 2017-03-04 10:45:54 +09:00 committed by François Chollet
parent 5b0967a08f
commit 65ce238f03

@@ -66,7 +66,11 @@ for name in sorted(os.listdir(TEXT_DATA_DIR)):
f = open(fpath)
else:
f = open(fpath, encoding='latin-1')
texts.append(f.read())
t = f.read()
i = t.find('\n\n') # skip header
if 0 < i:
t = t[i:]
texts.append(t)
f.close()
labels.append(label_id)
@@ -141,4 +145,4 @@ model.compile(loss='categorical_crossentropy',
# happy learning!
model.fit(x_train, y_train, validation_data=(x_val, y_val),
epochs=2, batch_size=128)
epochs=10, batch_size=128)