2015-12-09 02:49:14 +00:00
|
|
|
'''Train a recurrent convolutional network on the IMDB sentiment
|
|
|
|
classification task.
|
|
|
|
|
|
|
|
GPU command:
|
2016-01-29 21:31:53 +00:00
|
|
|
THEANO_FLAGS=mode=FAST_RUN,device=gpu,floatX=float32 python imdb_cnn_lstm.py
|
2015-12-09 02:49:14 +00:00
|
|
|
|
|
|
|
Get to 0.8498 test accuracy after 2 epochs. 41s/epoch on K520 GPU.
|
|
|
|
'''
|
|
|
|
|
2015-10-23 20:19:27 +00:00
|
|
|
from __future__ import print_function
|
|
|
|
import numpy as np
|
|
|
|
np.random.seed(1337) # for reproducibility
|
|
|
|
|
|
|
|
from keras.preprocessing import sequence
|
|
|
|
from keras.models import Sequential
|
|
|
|
from keras.layers.core import Dense, Dropout, Activation
|
|
|
|
from keras.layers.embeddings import Embedding
|
|
|
|
from keras.layers.recurrent import LSTM, GRU, SimpleRNN
|
|
|
|
from keras.layers.convolutional import Convolution1D, MaxPooling1D
|
|
|
|
from keras.datasets import imdb
|
|
|
|
|
|
|
|
|
2015-10-25 03:39:06 +00:00
|
|
|
# Embedding
|
2015-10-23 20:19:27 +00:00
|
|
|
max_features = 20000
|
2015-10-25 03:39:06 +00:00
|
|
|
maxlen = 100
|
2015-10-24 21:07:47 +00:00
|
|
|
embedding_size = 128
|
2015-10-23 20:19:27 +00:00
|
|
|
|
2015-10-25 03:39:06 +00:00
|
|
|
# Convolution
|
2015-10-23 20:19:27 +00:00
|
|
|
filter_length = 3
|
|
|
|
nb_filter = 64
|
2015-10-24 21:07:47 +00:00
|
|
|
pool_length = 2
|
2015-10-23 20:19:27 +00:00
|
|
|
|
2015-10-25 03:39:06 +00:00
|
|
|
# LSTM
|
2015-10-24 21:07:47 +00:00
|
|
|
lstm_output_size = 70
|
2015-10-23 20:19:27 +00:00
|
|
|
|
2015-10-25 03:39:06 +00:00
|
|
|
# Training
|
2015-10-23 20:19:27 +00:00
|
|
|
batch_size = 30
|
2015-10-24 21:07:47 +00:00
|
|
|
nb_epoch = 2
|
2015-10-25 03:39:06 +00:00
|
|
|
|
2015-10-23 20:19:27 +00:00
|
|
|
'''
|
|
|
|
Note:
|
|
|
|
batch_size is highly sensitive.
|
2015-10-25 03:39:06 +00:00
|
|
|
Only 2 epochs are needed as the dataset is very small.
|
2015-10-23 20:19:27 +00:00
|
|
|
'''
|
|
|
|
|
2015-12-09 02:49:14 +00:00
|
|
|
print('Loading data...')
|
2015-10-23 20:19:27 +00:00
|
|
|
(X_train, y_train), (X_test, y_test) = imdb.load_data(nb_words=max_features, test_split=0.2)
|
|
|
|
print(len(X_train), 'train sequences')
|
|
|
|
print(len(X_test), 'test sequences')
|
|
|
|
|
2015-12-09 02:49:14 +00:00
|
|
|
print('Pad sequences (samples x time)')
|
2015-10-23 20:19:27 +00:00
|
|
|
X_train = sequence.pad_sequences(X_train, maxlen=maxlen)
|
|
|
|
X_test = sequence.pad_sequences(X_test, maxlen=maxlen)
|
|
|
|
print('X_train shape:', X_train.shape)
|
|
|
|
print('X_test shape:', X_test.shape)
|
|
|
|
|
|
|
|
print('Build model...')
|
|
|
|
|
|
|
|
model = Sequential()
|
|
|
|
model.add(Embedding(max_features, embedding_size, input_length=maxlen))
|
|
|
|
model.add(Dropout(0.25))
|
|
|
|
model.add(Convolution1D(nb_filter=nb_filter,
|
|
|
|
filter_length=filter_length,
|
2015-12-09 02:49:14 +00:00
|
|
|
border_mode='valid',
|
|
|
|
activation='relu',
|
2015-10-23 20:19:27 +00:00
|
|
|
subsample_length=1))
|
|
|
|
model.add(MaxPooling1D(pool_length=pool_length))
|
2015-10-25 03:39:06 +00:00
|
|
|
model.add(LSTM(lstm_output_size))
|
2015-10-23 20:19:27 +00:00
|
|
|
model.add(Dense(1))
|
|
|
|
model.add(Activation('sigmoid'))
|
|
|
|
|
2015-10-25 03:39:06 +00:00
|
|
|
model.compile(loss='binary_crossentropy',
|
|
|
|
optimizer='adam',
|
2015-12-09 02:49:14 +00:00
|
|
|
class_mode='binary')
|
2015-10-23 20:19:27 +00:00
|
|
|
|
2015-12-09 02:49:14 +00:00
|
|
|
print('Train...')
|
2015-10-25 03:39:06 +00:00
|
|
|
model.fit(X_train, y_train, batch_size=batch_size, nb_epoch=nb_epoch,
|
|
|
|
validation_data=(X_test, y_test), show_accuracy=True)
|
|
|
|
score, acc = model.evaluate(X_test, y_test, batch_size=batch_size,
|
|
|
|
show_accuracy=True)
|
2015-10-23 20:19:27 +00:00
|
|
|
print('Test score:', score)
|
|
|
|
print('Test accuracy:', acc)
|