stress_asignment/workbench.py

# -*- coding: utf-8 -*-
from __future__ import unicode_literals
# text in Western (Windows 1252)

import pickle
import numpy as np
from keras import optimizers
from keras.models import Model
from keras.layers import Dense, Dropout, Input
from keras.layers.merge import concatenate
from keras.layers.convolutional import Conv1D
from keras.layers.convolutional import MaxPooling1D
from keras.layers import Flatten
# from keras import backend as Input
np.random.seed(7)

# get_ipython().magic('run ../../../prepare_data.py')

# import sys
# # sys.path.insert(0, '../../../')
# sys.path.insert(0, '/home/luka/Developement/accetuation/')
from prepare_data import *


# X_train, X_other_features_train, y_train, X_validate, X_other_features_validate, y_validate = generate_full_matrix_inputs()
# save_inputs('../../internal_representations/inputs/shuffeled_matrix_train_inputs_other_features_output_11.h5', X_train, y_train, other_features = X_other_features_train)
# save_inputs('../../internal_representations/inputs/shuffeled_matrix_validate_inputs_other_features_output_11.h5', X_validate, y_validate,  other_features = X_other_features_validate)
# X_train, X_other_features_train, y_train = load_inputs('cnn/internal_representations/inputs/shuffeled_matrix_train_inputs_other_features_output_11.h5', other_features=True)
# X_validate, X_other_features_validate, y_validate = load_inputs('cnn/internal_representations/inputs/shuffeled_matrix_validate_inputs_other_features_output_11.h5', other_features=True)
# letters
# data = Data('l', save_generated_data=False, number_of_syllables=True)

# syllabled letters
# Dataset wrapper provided by prepare_data (pulled in by the star import).
# NOTE(review): 's' selects the input representation; the exact meaning of the
# flag lives in prepare_data.Data -- confirm there.
data = Data(
    's',
    save_generated_data=False,
    accent_classification=True,
)

# The script reads data.x_* / data.x_other_features_* / data.y_* for the
# train, test and validate splits right after this call, so it presumably
# populates them -- TODO confirm against prepare_data.
data.generate_data(
    'letters_word_accetuation_train',
    'letters_word_accetuation_test',
    'letters_word_accetuation_validate',
    content_name='SlovarIJS_BESEDE_utf8.lex',
    content_shuffle_vector='content_shuffle_vector',
    shuffle_vector='shuffle_vector',
    inputs_location='',
    content_location='',
)

# concatenate test and train data
# data.x_train = np.concatenate((data.x_train, data.x_test), axis=0)
# data.x_other_features_train = np.concatenate((data.x_other_features_train, data.x_other_features_test), axis=0)
# data.y_train = np.concatenate((data.y_train, data.y_test), axis=0)

# Fold the test and validation splits into the training arrays (row-wise), so
# the three *_train attributes hold every available example afterwards.
data.x_train = np.concatenate(
    [data.x_train, data.x_test, data.x_validate],
    axis=0)
data.x_other_features_train = np.concatenate(
    [data.x_other_features_train,
     data.x_other_features_test,
     data.x_other_features_validate],
    axis=0)
data.y_train = np.concatenate(
    [data.y_train, data.y_test, data.y_validate],
    axis=0)

# Number of rows in the merged training set.
num_examples = data.x_train.shape[0]
# --- network sizes ---------------------------------------------------------
# Width of the final sigmoid Dense layer of the model built further down.
nn_output_dim = 13
# NOTE(review): nn_hdim is not referenced anywhere else in the visible script.
nn_hdim = 516

# --- training schedule -----------------------------------------------------
batch_size = 16
# The fit call runs actual_epoch * num_fake_epoch Keras epochs, each one
# spanning (training rows) / (batch_size * num_fake_epoch) generator steps.
# Earlier, smaller settings were actual_epoch = 1 and num_fake_epoch = 2.
actual_epoch = 20
num_fake_epoch = 20

# letters
# conv_input_shape=(23, 36)

# syllabled letters
# conv_input_shape=(10, 252)

# syllables
# Per-sample shape of the convolutional input (batch axis excluded).
conv_input_shape = (10, 5168)

# Per-sample shape of the auxiliary feature vector (an earlier setup used 140).
# Kept under its own name so `othr_input` only ever refers to the Input tensor.
othr_input_shape = (150, )

# --- convolutional branch: Conv1D -> max-pool -> flatten --------------------
# (The commented-out "letters" variant stacked two Conv1D layers instead:
#  115 filters then 46 filters, both with kernel size 3.)
# NOTE(review): the original comment labelled this layer "syllabled letters"
# although the active input shape is the one marked "syllables" -- confirm
# which configuration is intended.
conv_input = Input(shape=conv_input_shape, name='conv_input')
x_conv = Conv1D(filters=200, kernel_size=2, padding='same', activation='relu')(conv_input)
x_conv = MaxPooling1D(pool_size=2)(x_conv)
x_conv = Flatten()(x_conv)

# --- auxiliary branch: passed unchanged into the dense stack ----------------
othr_input = Input(shape=othr_input_shape, name='othr_input')

# --- dense head -------------------------------------------------------------
x = concatenate([x_conv, othr_input])
# Three identical Dense(256, relu) + Dropout(0.3) stages, created in the same
# order as when they were written out one by one.
for _ in range(3):
    x = Dense(256, activation='relu')(x)
    x = Dropout(0.3)(x)
x = Dense(nn_output_dim, activation='sigmoid')(x)


# Two-input functional model: the convolutional input and the auxiliary
# feature vector go in, the sigmoid layer `x` comes out.
model = Model(
    inputs=[conv_input, othr_input],
    outputs=x,
)

# Adam with an explicit learning rate of 1e-4; the remaining arguments are
# spelled out rather than left to the library defaults.
opt = optimizers.Adam(
    lr=1E-4,
    beta_1=0.9,
    beta_2=0.999,
    epsilon=1e-08,
)

# `actual_accuracy` is supplied by the star import from prepare_data.
model.compile(
    loss='binary_crossentropy',
    optimizer=opt,
    metrics=[actual_accuracy],
)
# model.compile(loss='mean_squared_error', optimizer='adam', metrics=['accuracy'])


# Train from the project's batch generator.
#
# steps_per_epoch uses floor division so it stays an integer on Python 3 as
# well; on Python 2 the plain `/` between two ints already floored, so the
# value is unchanged there. Each Keras epoch therefore covers roughly
# 1/num_fake_epoch of the training rows, and actual_epoch * num_fake_epoch
# epochs are run in total.
# NOTE(review): this assumes the generator yields batch_size samples per step
# and draws from the merged data.x_train -- confirm in prepare_data.
history = model.fit_generator(
    data.generator('train', batch_size, content_name='SlovarIJS_BESEDE_utf8.lex', content_location=''),
    steps_per_epoch=data.x_train.shape[0] // (batch_size * num_fake_epoch),
    epochs=actual_epoch * num_fake_epoch,
    verbose=2,
)

# Base name shared by the saved model and its training history.
# NOTE(review): the name is hard-coded and does not track actual_epoch (20).
name = '40_epoch'

# Persist the trained model in HDF5 format.
model.save(name + '.h5')

# Pickle the per-epoch metrics dict. The context manager closes the file even
# if pickle.dump raises, which the manual open()/close() pair did not.
with open(name + '_history.pkl', 'wb') as output:
    pickle.dump(history.history, output)
Moved some things 2017-07-04 08:28:27 +00:00			`# -- coding: utf-8 --`
			`from __future__ import unicode_literals`
			`# text in Western (Windows 1252)`

Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`import pickle`
Moved some things 2017-07-04 08:28:27 +00:00			`import numpy as np`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`from keras import optimizers`
			`from keras.models import Model`
			`from keras.layers import Dense, Dropout, Input`
Moved some things 2017-07-04 08:28:27 +00:00			`from keras.layers.merge import concatenate`
			`from keras.layers.convolutional import Conv1D`
			`from keras.layers.convolutional import MaxPooling1D`
			`from keras.layers import Flatten`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`# from keras import backend as Input`
Moved some things 2017-07-04 08:28:27 +00:00			`np.random.seed(7)`

			`# get_ipython().magic('run ../../../prepare_data.py')`

			`# import sys`
			`# # sys.path.insert(0, '../../../')`
			`# sys.path.insert(0, '/home/luka/Developement/accetuation/')`
			`from prepare_data import *`


			`# X_train, X_other_features_train, y_train, X_validate, X_other_features_validate, y_validate = generate_full_matrix_inputs()`
			`# save_inputs('../../internal_representations/inputs/shuffeled_matrix_train_inputs_other_features_output_11.h5', X_train, y_train, other_features = X_other_features_train)`
			`# save_inputs('../../internal_representations/inputs/shuffeled_matrix_validate_inputs_other_features_output_11.h5', X_validate, y_validate, other_features = X_other_features_validate)`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`# X_train, X_other_features_train, y_train = load_inputs('cnn/internal_representations/inputs/shuffeled_matrix_train_inputs_other_features_output_11.h5', other_features=True)`
			`# X_validate, X_other_features_validate, y_validate = load_inputs('cnn/internal_representations/inputs/shuffeled_matrix_validate_inputs_other_features_output_11.h5', other_features=True)`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00			`# letters`
			`# data = Data('l', save_generated_data=False, number_of_syllables=True)`

			`# syllabled letters`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`data = Data('s', save_generated_data=False, accent_classification=True)`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`data.generate_data('letters_word_accetuation_train',`
			`'letters_word_accetuation_test',`
			`'letters_word_accetuation_validate', content_name='SlovarIJS_BESEDE_utf8.lex',`
			`content_shuffle_vector='content_shuffle_vector', shuffle_vector='shuffle_vector',`
			`inputs_location='', content_location='')`

Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`# concatenate test and train data`
			`# data.x_train = np.concatenate((data.x_train, data.x_test), axis=0)`
			`# data.x_other_features_train = np.concatenate((data.x_other_features_train, data.x_other_features_test), axis=0)`
			`# data.y_train = np.concatenate((data.y_train, data.y_test), axis=0)`

			`# concatenate all data`
			`data.x_train = np.concatenate((data.x_train, data.x_test, data.x_validate), axis=0)`
			`data.x_other_features_train = np.concatenate((data.x_other_features_train, data.x_other_features_test, data.x_other_features_validate), axis=0)`
			`data.y_train = np.concatenate((data.y_train, data.y_test, data.y_validate), axis=0)`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00
			`num_examples = len(data.x_train) # training set size`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00			`nn_output_dim = 13`
Moved some things 2017-07-04 08:28:27 +00:00			`nn_hdim = 516`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`batch_size = 16`
			`# actual_epoch = 1`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`actual_epoch = 20`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`# num_fake_epoch = 2`
			`num_fake_epoch = 20`

Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00			`# letters`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`# conv_input_shape=(23, 36)`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00
			`# syllabled letters`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`# conv_input_shape=(10, 252)`

			`# syllables`
			`conv_input_shape=(10, 5168)`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00

			`# othr_input = (140, )`
			`othr_input = (150, )`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00
			`conv_input = Input(shape=conv_input_shape, name='conv_input')`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00			`# letters`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`# x_conv = Conv1D(115, (3), padding='same', activation='relu')(conv_input)`
			`# x_conv = Conv1D(46, (3), padding='same', activation='relu')(x_conv)`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00
			`# syllabled letters`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`x_conv = Conv1D(200, (2), padding='same', activation='relu')(conv_input)`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`x_conv = MaxPooling1D(pool_size=2)(x_conv)`
			`x_conv = Flatten()(x_conv)`

			`othr_input = Input(shape=othr_input, name='othr_input')`

			`x = concatenate([x_conv, othr_input])`
			`# x = Dense(1024, input_dim=(516 + 256), activation='relu')(x)`
			`x = Dense(256, activation='relu')(x)`
			`x = Dropout(0.3)(x)`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`x = Dense(256, activation='relu')(x)`
Added multiple results and created working grid settings and scripts 2017-08-29 18:06:59 +00:00			`x = Dropout(0.3)(x)`
Added multiple results and error analysis 2017-09-07 17:32:36 +00:00			`x = Dense(256, activation='relu')(x)`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`x = Dropout(0.3)(x)`
			`x = Dense(nn_output_dim, activation='sigmoid')(x)`
Moved some things 2017-07-04 08:28:27 +00:00



Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`model = Model(inputs=[conv_input, othr_input], outputs=x)`
			`opt = optimizers.Adam(lr=1E-4, beta_1=0.9, beta_2=0.999, epsilon=1e-08)`
			`model.compile(loss='binary_crossentropy', optimizer=opt, metrics=[actual_accuracy,])`
			`# model.compile(loss='mean_squared_error', optimizer='adam', metrics=['accuracy'])`
Moved some things 2017-07-04 08:28:27 +00:00

Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`history = model.fit_generator(data.generator('train', batch_size, content_name='SlovarIJS_BESEDE_utf8.lex', content_location=''),`
			`data.x_train.shape[0]/(batch_size * num_fake_epoch),`
			`epochs=actual_epoch*num_fake_epoch,`
Added some results 2017-08-21 07:30:14 +00:00			`verbose=2`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`)`
Moved some things 2017-07-04 08:28:27 +00:00
Added some results 2017-08-21 07:30:14 +00:00			`name = '40_epoch'`
Added num of letters to x_other_features 2017-08-18 17:08:42 +00:00			`model.save(name + '.h5')`
			`output = open(name + '_history.pkl', 'wb')`
			`pickle.dump(history.history, output)`
			`output.close()`