0% found this document useful (0 votes)

59 views4 pages

Assignment 10 2

The document loads Keras and other Python libraries for building and evaluating a neural network model for sentiment analysis on the IMDB movie reviews dataset. It preprocesses the data, builds an embedding and dense layer model, trains it for 10 epochs, evaluates accuracy on validation data during training, and finally evaluates the saved model on held-out test data.

Uploaded by

dash

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

59 views4 pages

Assignment 10 2

Uploaded by

dash

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

10.

2
In [1]:
from keras.preprocessing.text import Tokenizer

from keras.preprocessing.sequence import pad_sequences

import numpy as np

import matplotlib.pyplot as plt

from pathlib import Path

from keras.models import Sequential

from keras.layers import Embedding, Flatten, Dense

import os

from contextlib import redirect_stdout

import time

start_time = time.time()

In [8]:
results_dir = Path('results').joinpath('model_1')

results_dir.mkdir(parents=True, exist_ok=True)

# path for IMDB data

imdb_dir = Path('/home/desktop/dsc650/data/external/imdb/aclImdb/')
test_dir = os.path.join(imdb_dir, 'test')

train_dir = os.path.join(imdb_dir, 'train')

In [9]:
training_samples = 200

maxlen = 100 # cuts off review after 100 words

max_words = 1000 # Considers only the top 1000 words in the dataset
embedding_dim = 100

training_samples = 200 # trains on 200 samples

validation_samples = 10000 # validates on 10000 samples

In [10]:
labels = []

texts = []

for label_type in ['neg', 'pos']:

dir_name = os.path.join(test_dir, label_type)

for fname in sorted(os.listdir(dir_name)):

if fname[-4:] == '.txt':

f = open(os.path.join(dir_name, fname), encoding="utf8")

texts.append(f.read())

f.close()

if label_type == 'neg':

labels.append(0)

else:

labels.append(1)

In [11]:
tokenizer = Tokenizer(num_words=max_words)

tokenizer.fit_on_texts(texts)

sequences = tokenizer.texts_to_sequences(texts)

word_index = tokenizer.word_index
print('Found %s unique tokens.' % len(word_index))

data = pad_sequences(sequences, maxlen=maxlen)

labels = np.asarray(labels)

print('Shape of data tensor:', data.shape)

print('Shape of label tensor:', labels.shape)

Found 87393 unique tokens.

Shape of data tensor: (25000, 100)

Loading [MathJax]/jax/output/CommonHTML/fonts/TeX/fontdata.js
Shape of label tensor: (25000,)

In [12]:
indices = np.arange(data.shape[0])

np.random.shuffle(indices)

data = data[indices]

labels = labels[indices]

x_train = data[:training_samples]
y_train = labels[:training_samples]

x_val = data[training_samples: training_samples + validation_samples]

y_val = labels[training_samples: training_samples + validation_samples]

In [13]:
# from page 191 Listing 6.12

model = Sequential()

model.add(Embedding(max_words, embedding_dim, input_length=maxlen))

model.add(Flatten())

model.add(Dense(32,activation='relu'))

model.add(Dense(1, activation='sigmoid'))

In [14]:
# Save the summary to file

summary_file = results_dir.joinpath('Assignment_10.2_ModelSummary.txt')

with open(summary_file, 'w') as f:

with redirect_stdout(f):

model.summary()

# from page 192

model.compile(optimizer='rmsprop', loss='binary_crossentropy', metrics=['acc'])

history=model.fit(x_train, y_train, epochs=10, batch_size=32,validation_data=(x_val,

result_model_file = results_dir.joinpath('pre_trained_glove_model.h5')

model.save_weights(result_model_file)

Epoch 1/10

7/7 [==============================] - 1s 120ms/step - loss: 0.6966 - acc: 0.4703 -

val_loss: 0.6928 - val_acc: 0.5115
Epoch 2/10

7/7 [==============================] - 1s 101ms/step - loss: 0.5752 - acc: 0.9481 -

val_loss: 0.6933 - val_acc: 0.5143
Epoch 3/10

7/7 [==============================] - 1s 96ms/step - loss: 0.4203 - acc: 0.9792 - v

al_loss: 0.6991 - val_acc: 0.5142

Epoch 4/10

7/7 [==============================] - 1s 104ms/step - loss: 0.2528 - acc: 0.9674 -

val_loss: 0.7005 - val_acc: 0.5265
Epoch 5/10

7/7 [==============================] - 1s 99ms/step - loss: 0.1495 - acc: 0.9931 - v

al_loss: 0.7039 - val_acc: 0.5273

Epoch 6/10

7/7 [==============================] - 1s 99ms/step - loss: 0.0822 - acc: 0.9963 - v

al_loss: 0.7383 - val_acc: 0.5208

Epoch 7/10

7/7 [==============================] - 1s 100ms/step - loss: 0.0541 - acc: 1.0000 -

val_loss: 0.7206 - val_acc: 0.5307
Epoch 8/10

7/7 [==============================] - 1s 99ms/step - loss: 0.0295 - acc: 1.0000 - v

al_loss: 0.7405 - val_acc: 0.5246

Epoch 9/10

7/7 [==============================] - 1s 101ms/step - loss: 0.0179 - acc: 1.0000 -

val_loss: 0.7399 - val_acc: 0.5295
Epoch 10/10

7/7 [==============================] - 1s 101ms/step - loss: 0.0099 - acc: 1.0000 -

val_loss: 0.7519 - val_acc: 0.5313

In [15]:
Loading [MathJax]/jax/output/CommonHTML/fonts/TeX/fontdata.js
# Plots

acc = history.history['acc']

val_acc = history.history['val_acc']

loss = history.history['loss']

val_loss = history.history['val_loss']

epochs = range(1, len(acc) + 1)

plt.plot(epochs, acc, 'bo', label='Training acc')

plt.plot(epochs, val_acc, 'b', label='Validation acc')

plt.title('Training and validation accuracy')

plt.legend()

plt.figure()

plt.plot(epochs, loss, 'bo', label='Training loss')

plt.plot(epochs, val_loss, 'b', label='Validation loss')

plt.title('Training and validation loss')

plt.legend()

img_file = results_dir.joinpath('Assignment_10.2_Model Accuracy Validation.png')

plt.savefig(img_file)

plt.show()

In [16]:
labels=[]

texts=[]

for label_type in ['neg', 'pos']:

dir_name = os.path.join(test_dir, label_type)

for fname in sorted(os.listdir(dir_name)):

if fname[-4:] == '.txt':

f = open(os.path.join(dir_name, fname), encoding="utf8")

texts.append(f.read())

f.close()

if label_type == 'neg':

labels.append(0)

Loading [MathJax]/jax/output/CommonHTML/fonts/TeX/fontdata.js
else:

labels.append(1)

In [17]:
sequence = tokenizer.texts_to_sequences(texts)

x_test = pad_sequences(sequences, maxlen=maxlen)

y_test = np.asarray(labels)

model.load_weights(result_model_file)

eval = model.evaluate(x_test, y_test)

print("")

print(eval)

print("Complete: --- %s seconds has passed ---" % (time.time() - start_time))

782/782 [==============================] - 2s 2ms/step - loss: 0.7500 - acc: 0.5329

[0.750030517578125, 0.5329200029373169]

Complete: --- 453.8152759075165 seconds has passed ---

In [ ]:

Loading [MathJax]/jax/output/CommonHTML/fonts/TeX/fontdata.js

Presentation Mikrotik
No ratings yet
Presentation Mikrotik
68 pages
Assignment10 4
100% (1)
Assignment10 4
3 pages
Binary Classification - Ipynb - Colab
No ratings yet
Binary Classification - Ipynb - Colab
5 pages
Dl 5 Excuted
No ratings yet
Dl 5 Excuted
13 pages
Sample
No ratings yet
Sample
6 pages
vertopal.com_movie review classification
No ratings yet
vertopal.com_movie review classification
5 pages
Apex For Bres 1
No ratings yet
Apex For Bres 1
6 pages
Deep Learning Programs Updated
No ratings yet
Deep Learning Programs Updated
24 pages
vertopal.com_8-12
No ratings yet
vertopal.com_8-12
6 pages
Exp 6,7,8
No ratings yet
Exp 6,7,8
17 pages
Deep Learning Manual (1)
No ratings yet
Deep Learning Manual (1)
53 pages
Finding Similar Fashion Products With Their Links
No ratings yet
Finding Similar Fashion Products With Their Links
19 pages
Downloaded by R GAYATHRI (R.gayathri@aalimec - Ac.in)
No ratings yet
Downloaded by R GAYATHRI (R.gayathri@aalimec - Ac.in)
56 pages
DL5.ipynb - Colab
No ratings yet
DL5.ipynb - Colab
3 pages
AD3511 - Deep Learning Lab Manual - - Copy
No ratings yet
AD3511 - Deep Learning Lab Manual - - Copy
61 pages
dl_5 excuted
No ratings yet
dl_5 excuted
13 pages
Integer-Encoding-Simplernn - Ipynb - Colaboratory
No ratings yet
Integer-Encoding-Simplernn - Ipynb - Colaboratory
4 pages
ML PPT G3
No ratings yet
ML PPT G3
15 pages
DL
No ratings yet
DL
17 pages
Deep Learning Lab Manual
No ratings yet
Deep Learning Lab Manual
46 pages
Design A Neural Network For Classifying Movie Reviews
No ratings yet
Design A Neural Network For Classifying Movie Reviews
5 pages
IMDB - Colaboratory
No ratings yet
IMDB - Colaboratory
10 pages
vertopal.com_HandWritten
No ratings yet
vertopal.com_HandWritten
13 pages
Deep Learning Lab Manual
No ratings yet
Deep Learning Lab Manual
88 pages
NNDL 7&8 Programs
No ratings yet
NNDL 7&8 Programs
7 pages
DEEP LEARNING MANUAL Final
No ratings yet
DEEP LEARNING MANUAL Final
14 pages
dl exps
No ratings yet
dl exps
9 pages
Course 3 - Week 2 - Exercise - Answer - Ipynb - Colaboratory
No ratings yet
Course 3 - Week 2 - Exercise - Answer - Ipynb - Colaboratory
8 pages
Dl lab answers batch 2
No ratings yet
Dl lab answers batch 2
27 pages
Content: From Import Import As Import Import Import As
No ratings yet
Content: From Import Import As Import Import Import As
8 pages
Chapter02 Mathematical-Building-Blocks
No ratings yet
Chapter02 Mathematical-Building-Blocks
9 pages
DL_20-WordEmbeddings.ipynb - Colab
No ratings yet
DL_20-WordEmbeddings.ipynb - Colab
6 pages
program 5
No ratings yet
program 5
3 pages
nndl2 (2)
No ratings yet
nndl2 (2)
67 pages
748747019-ad3511-deep-learning-lab-manual-iii-yearjnn (1)-1
No ratings yet
748747019-ad3511-deep-learning-lab-manual-iii-yearjnn (1)-1
51 pages
dl_6
No ratings yet
dl_6
5 pages
Experiment 3 (D, E) (Embedding) (Plotting) PDF
No ratings yet
Experiment 3 (D, E) (Embedding) (Plotting) PDF
8 pages
Cv prince
No ratings yet
Cv prince
120 pages
word2vec
No ratings yet
word2vec
3 pages
Notebook - Tensorflow Keras
No ratings yet
Notebook - Tensorflow Keras
25 pages
Dl Prac03IT
No ratings yet
Dl Prac03IT
7 pages
ass_3
No ratings yet
ass_3
5 pages
deep learning lab
No ratings yet
deep learning lab
26 pages
Ex_5
No ratings yet
Ex_5
3 pages
Sample code
No ratings yet
Sample code
8 pages
Image Caption2
No ratings yet
Image Caption2
9 pages
CVcode
No ratings yet
CVcode
4 pages
Assignment 2.4.1 Multiclass Classification
No ratings yet
Assignment 2.4.1 Multiclass Classification
5 pages
Dl Lab Manual
No ratings yet
Dl Lab Manual
18 pages
Hand Written
No ratings yet
Hand Written
5 pages
Vertopal.com Wild Fire Cnn Accuracy 95 (1)
No ratings yet
Vertopal.com Wild Fire Cnn Accuracy 95 (1)
15 pages
EncoderDecoderSeq2Seq DeepLSTM
No ratings yet
EncoderDecoderSeq2Seq DeepLSTM
7 pages
S. NO. Title of The Experiments Page No
No ratings yet
S. NO. Title of The Experiments Page No
11 pages
Labpractice 2
100% (2)
Labpractice 2
29 pages
DL2 - Jupyter Notebook
No ratings yet
DL2 - Jupyter Notebook
5 pages
Vertopal.com HW4ML Project Code
No ratings yet
Vertopal.com HW4ML Project Code
24 pages
Image Classification of An American Sign Language Dataset: Objectives
No ratings yet
Image Classification of An American Sign Language Dataset: Objectives
11 pages
assignment no 2
No ratings yet
assignment no 2
3 pages
Practical No10
No ratings yet
Practical No10
4 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
The Essential R Reference
From Everand
The Essential R Reference
Mark Gardener
No ratings yet
Assignment 6.3
No ratings yet
Assignment 6.3
2 pages
Employee Warning Letter 14
No ratings yet
Employee Warning Letter 14
1 page
Math 110 Activity 6: Open The CPI File To Use For This Activity. 1. Converting To Constant Dollars
No ratings yet
Math 110 Activity 6: Open The CPI File To Use For This Activity. 1. Converting To Constant Dollars
3 pages
Visualization Analysis Pca
No ratings yet
Visualization Analysis Pca
24 pages
Data Analysis Project News Article Grading Criteria and Rubric
No ratings yet
Data Analysis Project News Article Grading Criteria and Rubric
1 page
Ieee Pid Control System Analysis Design and Technology
No ratings yet
Ieee Pid Control System Analysis Design and Technology
18 pages
The Vehicle Steer by Wire Control System by Implementing PID Controller
No ratings yet
The Vehicle Steer by Wire Control System by Implementing PID Controller
5 pages
Front Wheel Angle Control of Steering by Wire System Based On Fuzzy Adaptive PID Algorithm
No ratings yet
Front Wheel Angle Control of Steering by Wire System Based On Fuzzy Adaptive PID Algorithm
7 pages
The Design of A Controller For The Steer-by-Wire System: Key Words
No ratings yet
The Design of A Controller For The Steer-by-Wire System: Key Words
12 pages
Front Wheel Angle Control of Steering by Wire System Based On Fuzzy Adaptive PID Algorithm
No ratings yet
Front Wheel Angle Control of Steering by Wire System Based On Fuzzy Adaptive PID Algorithm
7 pages
Free Tiktok Likes Trial - GM835599320
No ratings yet
Free Tiktok Likes Trial - GM835599320
2 pages
Systemverilog-Module3-Dec2021
No ratings yet
Systemverilog-Module3-Dec2021
68 pages
Virtual Whiteboard Using Hand Gestures
No ratings yet
Virtual Whiteboard Using Hand Gestures
42 pages
Advanced Eap7 Cheat Sheet r2v1
No ratings yet
Advanced Eap7 Cheat Sheet r2v1
8 pages
Computer Applications - Notes
100% (1)
Computer Applications - Notes
25 pages
FreeBSD Handbook Introduction (Online Edition)
No ratings yet
FreeBSD Handbook Introduction (Online Edition)
11 pages
Anil Resume Sap-Abap PDF
No ratings yet
Anil Resume Sap-Abap PDF
2 pages
BDA Question bank with solutions
No ratings yet
BDA Question bank with solutions
88 pages
LAP #1
No ratings yet
LAP #1
11 pages
p44 Norman 1
100% (7)
p44 Norman 1
2 pages
Expressed in Terms of Parameter
No ratings yet
Expressed in Terms of Parameter
4 pages
ALV Reports Using FM
No ratings yet
ALV Reports Using FM
32 pages
Successfactors Employee Central Time Account Accrual
No ratings yet
Successfactors Employee Central Time Account Accrual
29 pages
ConceptDraw PRO 11 Reference Mac
No ratings yet
ConceptDraw PRO 11 Reference Mac
122 pages
Sheetal Project Report
No ratings yet
Sheetal Project Report
68 pages
SyllabusPDF 160261 16663629593975BF54
No ratings yet
SyllabusPDF 160261 16663629593975BF54
9 pages
Secure Access Labs (FAP+FG) V5.6
No ratings yet
Secure Access Labs (FAP+FG) V5.6
59 pages
Hexadecimal Numbers: Mr. Mcbrien Tej2O
No ratings yet
Hexadecimal Numbers: Mr. Mcbrien Tej2O
51 pages
Narrative Report Mental Health
No ratings yet
Narrative Report Mental Health
9 pages
Pci DSS:: What Every Dba Needs To Know
No ratings yet
Pci DSS:: What Every Dba Needs To Know
6 pages
Administering Contact Recorder en
No ratings yet
Administering Contact Recorder en
84 pages
CSS Selectors & Units Cheat Sheet Web Dev Topics Learn The Web
No ratings yet
CSS Selectors & Units Cheat Sheet Web Dev Topics Learn The Web
8 pages
Profiles How To
No ratings yet
Profiles How To
11 pages
Druck Digital Test Gauge: Measurement & Control Solutions
No ratings yet
Druck Digital Test Gauge: Measurement & Control Solutions
4 pages
CJICT Azeez Digital+Twins
No ratings yet
CJICT Azeez Digital+Twins
15 pages
Milestone 3 IT600
No ratings yet
Milestone 3 IT600
4 pages
The Intune Best Practices Checklist
No ratings yet
The Intune Best Practices Checklist
36 pages
C++ Project in + Theory
0% (1)
C++ Project in + Theory
6 pages
Macrium Reflect Patch Log
No ratings yet
Macrium Reflect Patch Log
5 pages

Assignment 10 2

Uploaded by

Assignment 10 2

Uploaded by

10.

from keras.preprocessing.sequence import pad_sequences

import matplotlib.pyplot as plt

from pathlib import Path

from keras.models import Sequential

from keras.layers import Embedding, Flatten, Dense

from contextlib import redirect_stdout

# path for IMDB data

train_dir = os.path.join(imdb_dir, 'train')

maxlen = 100 # cuts off review after 100 words

training_samples = 200 # trains on 200 samples

validation_samples = 10000 # validates on 10000 samples

for label_type in ['neg', 'pos']:

dir_name = os.path.join(test_dir, label_type)

for fname in sorted(os.listdir(dir_name)):

f = open(os.path.join(dir_name, fname), encoding="utf8")

data = pad_sequences(sequences, maxlen=maxlen)

print('Shape of data tensor:', data.shape)

print('Shape of label tensor:', labels.shape)

Found 87393 unique tokens.

Shape of data tensor: (25000, 100)

x_val = data[training_samples: training_samples + validation_samples]

y_val = labels[training_samples: training_samples + validation_samples]

model.add(Embedding(max_words, embedding_dim, input_length=maxlen))

with open(summary_file, 'w') as f:

# from page 192

model.compile(optimizer='rmsprop', loss='binary_crossentropy', metrics=['acc'])

history=model.fit(x_train, y_train, epochs=10, batch_size=32,validation_data=(x_val,

7/7 [==============================] - 1s 120ms/step - loss: 0.6966 - acc: 0.4703 -

7/7 [==============================] - 1s 101ms/step - loss: 0.5752 - acc: 0.9481 -

7/7 [==============================] - 1s 96ms/step - loss: 0.4203 - acc: 0.9792 - v

7/7 [==============================] - 1s 104ms/step - loss: 0.2528 - acc: 0.9674 -

7/7 [==============================] - 1s 99ms/step - loss: 0.1495 - acc: 0.9931 - v

7/7 [==============================] - 1s 99ms/step - loss: 0.0822 - acc: 0.9963 - v

7/7 [==============================] - 1s 100ms/step - loss: 0.0541 - acc: 1.0000 -

7/7 [==============================] - 1s 99ms/step - loss: 0.0295 - acc: 1.0000 - v

7/7 [==============================] - 1s 101ms/step - loss: 0.0179 - acc: 1.0000 -

7/7 [==============================] - 1s 101ms/step - loss: 0.0099 - acc: 1.0000 -

epochs = range(1, len(acc) + 1)

plt.plot(epochs, acc, 'bo', label='Training acc')

plt.plot(epochs, val_acc, 'b', label='Validation acc')

plt.title('Training and validation accuracy')

plt.plot(epochs, loss, 'bo', label='Training loss')

plt.plot(epochs, val_loss, 'b', label='Validation loss')

plt.title('Training and validation loss')

img_file = results_dir.joinpath('Assignment_10.2_Model Accuracy Validation.png')

for label_type in ['neg', 'pos']:

dir_name = os.path.join(test_dir, label_type)

for fname in sorted(os.listdir(dir_name)):

f = open(os.path.join(dir_name, fname), encoding="utf8")

x_test = pad_sequences(sequences, maxlen=maxlen)

eval = model.evaluate(x_test, y_test)

print("Complete: --- %s seconds has passed ---" % (time.time() - start_time))

782/782 [==============================] - 2s 2ms/step - loss: 0.7500 - acc: 0.5329

Complete: --- 453.8152759075165 seconds has passed ---

You might also like