skip newsgroup header (#5585)
This commit is contained in:
parent
5b0967a08f
commit
65ce238f03
@@ -66,7 +66,11 @@ for name in sorted(os.listdir(TEXT_DATA_DIR)):
|
||||
f = open(fpath)
|
||||
else:
|
||||
f = open(fpath, encoding='latin-1')
|
||||
texts.append(f.read())
|
||||
t = f.read()
|
||||
i = t.find('\n\n') # skip header
|
||||
if 0 < i:
|
||||
t = t[i:]
|
||||
texts.append(t)
|
||||
f.close()
|
||||
labels.append(label_id)
|
||||
|
||||
@@ -141,4 +145,4 @@ model.compile(loss='categorical_crossentropy',
|
||||
|
||||
# happy learning!
|
||||
model.fit(x_train, y_train, validation_data=(x_val, y_val),
|
||||
epochs=2, batch_size=128)
|
||||
epochs=10, batch_size=128)
|
||||
|
Loading…
Reference in New Issue
Block a user