import pandas as pd
import numpy as np
from sklearn.metrics import confusion_matrix
from tensorflow.keras.preprocessing.text import Tokenizer
from tensorflow.keras.preprocessing.sequence import pad_sequences
from tensorflow.keras.layers import (Input, Embedding, Conv1D, MaxPooling1D,
                                     LSTM, Dense, Dropout, Concatenate)
from tensorflow.keras.models import Model
from tensorflow.keras.optimizers import RMSprop
from tensorflow.keras.callbacks import EarlyStopping
import matplotlib.pyplot as plt
print('import done')
# Define hyperparameters
MAX_SEQ_LENGTH = 100      # tokens per tweet after padding/truncation
MAX_NB_WORDS = 20000      # vocabulary size kept by the tokenizer
EMBEDDING_DIM = 100       # must match the GloVe file loaded below
FILTER_SIZES = [3, 5, 7]  # kernel widths of the parallel Conv1D branches
NUM_FILTERS = 256         # filters per Conv1D branch
LSTM_UNITS = 256
DENSE_UNITS = 1           # single sigmoid unit for binary sentiment
DROPOUT_RATE = 0.5
PATIENCE = 10             # early-stopping patience in epochs
print('config done')
# Load the dataset
df = pd.read_csv("/kaggle/input/sentiment140/training.1600000.processed.noemoticon.csv",
                 encoding='latin-1', header=None)
df.columns = ["sentiment", "id", "date", "query", "user", "text"]
df = df[["sentiment", "text"]]
df["sentiment"] = df["sentiment"].replace({0: "negative", 4: "positive"})
texts = df["text"].values
labels = df["sentiment"].values
labels = np.array([1 if label == "positive" else 0 for label in labels])
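# Sentiment140 is sorted by label (all negatives first), and validation_split
# takes the last fraction of the arrays *before* any shuffling, so shuffle once
# here to avoid a single-class validation set.
rng = np.random.default_rng(42)
shuffle_idx = rng.permutation(len(texts))
texts, labels = texts[shuffle_idx], labels[shuffle_idx]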
print(df.head(10))
# Preprocess text data
tokenizer = Tokenizer(num_words=MAX_NB_WORDS)
tokenizer.fit_on_texts(texts)
sequences = tokenizer.texts_to_sequences(texts)
word_index = tokenizer.word_index
data = pad_sequences(sequences, maxlen=MAX_SEQ_LENGTH)
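# data now has shape (len(texts), MAX_SEQ_LENGTH); shorter tweets are padded
# with zeros on the left (pad_sequences defaults to padding='pre').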
# Load pre-trained word embeddings (e.g., GloVe)
embedding_dim = EMBEDDING_DIM  # keep in sync with the hyperparameter block above
embedding_index = {}
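# glove.6B.100d.txt is not bundled with the Kaggle dataset; download it from
# https://nlp.stanford.edu/projects/glove/ and place it in the working directory.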
with open('glove.6B.100d.txt', encoding='utf-8') as f:
    for line in f:
        values = line.split()
        word = values[0]
        coefficients = np.asarray(values[1:], dtype='float32')
        embedding_index[word] = coefficients
# Create embedding matrix
num_words = min(MAX_NB_WORDS, len(word_index) + 1)
embedding_matrix = np.zeros((num_words, embedding_dim))
for word, i in word_index.items():
    if i >= MAX_NB_WORDS:
        continue
    embedding_vector = embedding_index.get(word)
    if embedding_vector is not None:
        embedding_matrix[i] = embedding_vector
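# Words missing from GloVe (and index 0, reserved for padding) keep all-zero rows.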
# Define model architecture
inputs = Input(shape=(MAX_SEQ_LENGTH,))
embedding = Embedding(input_dim=num_words, output_dim=embedding_dim,
                      input_length=MAX_SEQ_LENGTH, weights=[embedding_matrix],
                      trainable=False)(inputs)  # trainable=False freezes the GloVe vectors; set True to fine-tune them
conv_layers = []
for filter_size in FILTER_SIZES:
    conv = Conv1D(filters=NUM_FILTERS, kernel_size=filter_size,
                  activation='relu')(embedding)
    pool = MaxPooling1D(pool_size=MAX_SEQ_LENGTH - filter_size + 1)(conv)
    conv_layers.append(pool)
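# Each branch is max-pooled over its full feature map, so every pooled tensor
# has shape (batch, 1, NUM_FILTERS) and the concatenation below has shape
# (batch, 1, len(FILTER_SIZES) * NUM_FILTERS); the LSTM therefore processes a
# one-step sequence.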
concat = Concatenate()(conv_layers)
lstm = LSTM(units=LSTM_UNITS)(concat)
dropout = Dropout(rate=DROPOUT_RATE)(lstm)
outputs = Dense(units=DENSE_UNITS, activation='sigmoid')(dropout)
model = Model(inputs=inputs, outputs=outputs)
optimizer = RMSprop(learning_rate=0.001)
model.compile(optimizer=optimizer, loss='binary_crossentropy',
              metrics=['accuracy'])
model.summary()
# Train the model with early stopping
# baseline=0.85 stops training if val_accuracy fails to exceed 0.85 within
# PATIENCE epochs; restore_best_weights keeps the best epoch's weights.
es = EarlyStopping(monitor='val_accuracy', patience=PATIENCE, mode='max',
                   min_delta=0.01, baseline=0.85, restore_best_weights=True)
history = model.fit(data, labels, epochs=50, validation_split=0.3, callbacks=[es])
# Plot accuracy
plt.plot(history.history['accuracy'])
plt.plot(history.history['val_accuracy'])
plt.title('Model Accuracy')
plt.xlabel('Epoch')
plt.ylabel('Accuracy')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()
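# Loss curves tell the same story from the other side and are worth checking
# when accuracy plateaus; this mirrors the accuracy plot above.
plt.plot(history.history['loss'])
plt.plot(history.history['val_loss'])
plt.title('Model Loss')
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.legend(['Train', 'Validation'], loc='upper right')
plt.show()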
# Make predictions on new data
new_texts = ["is upset that he can't update his Facebook by texting it... and might
cry as a result School today ...",
"@Kenichan I dived many times for the ball. Managed to save 50% The
rest go out of bounds",
"my whole body feels itchy and like its on fire",
"@nationwideclass no, it's not behaving at all. i'm mad. why am i
here? because I can't see you all o...",
"@Kwesidei not the whole crew",
"@LettyA ahh ive always wanted to see rent love the soundtrack!!",
"@FakerPattyPattz Oh dear. Were you drinking out of the forgotten
table drinks? "]
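# Reuse the fitted tokenizer so the new tweets map to the same word indices;
# words it has never seen are silently dropped (no oov_token was set).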
new_sequences = tokenizer.texts_to_sequences(new_texts)
new_data = pad_sequences(new_sequences, maxlen=MAX_SEQ_LENGTH)
predictions = model.predict(new_data)
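# Pair each tweet with its predicted label and probability for a quick sanity check.
for tweet, prob in zip(new_texts, predictions.ravel()):
    print(f"{'positive' if prob > 0.5 else 'negative'} ({prob:.3f}): {tweet[:60]}")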
# Evaluate the model
y_pred = (predictions > 0.5).astype(int).ravel()  # threshold sigmoid outputs and flatten to 1-D for sklearn
y_true = np.array([0, 0, 0, 0, 0, 0, 0])  # true labels of the new tweets (all from the negative rows of Sentiment140)
cm = confusion_matrix(y_true, y_pred)
print(cm)
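# Optional fuller breakdown. Pinning labels=[0, 1] keeps the report valid even
# though these sample tweets are all negative; zero_division=0 silences the
# resulting undefined-precision warnings for the positive class.
from sklearn.metrics import classification_report
print(classification_report(y_true, y_pred, labels=[0, 1],
                            target_names=['negative', 'positive'], zero_division=0))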