skip newsgroup header (#5585)
This commit is contained in:
parent
5b0967a08f
commit
65ce238f03
@@ -66,7 +66,11 @@ for name in sorted(os.listdir(TEXT_DATA_DIR)):
|
|||||||
f = open(fpath)
|
f = open(fpath)
|
||||||
else:
|
else:
|
||||||
f = open(fpath, encoding='latin-1')
|
f = open(fpath, encoding='latin-1')
|
||||||
texts.append(f.read())
|
t = f.read()
|
||||||
|
i = t.find('\n\n') # skip header
|
||||||
|
if 0 < i:
|
||||||
|
t = t[i:]
|
||||||
|
texts.append(t)
|
||||||
f.close()
|
f.close()
|
||||||
labels.append(label_id)
|
labels.append(label_id)
|
||||||
|
|
||||||
@@ -141,4 +145,4 @@ model.compile(loss='categorical_crossentropy',
|
|||||||
|
|
||||||
# happy learning!
|
# happy learning!
|
||||||
model.fit(x_train, y_train, validation_data=(x_val, y_val),
|
model.fit(x_train, y_train, validation_data=(x_val, y_val),
|
||||||
epochs=2, batch_size=128)
|
epochs=10, batch_size=128)
|
||||||
|
Loading…
Reference in New Issue
Block a user