import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import torch
from sklearn.metrics import confusion_matrix
from tensorflow.keras.preprocessing.sequence import pad_sequences
from tensorflow.keras.layers import (Input, Conv1D, MaxPooling1D, GRU,
                                     Dense, Dropout, Concatenate)
from tensorflow.keras.models import Model
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.callbacks import EarlyStopping
from transformers import GPT2Tokenizer, GPT2Model
print('import done')
# Define hyperparameters
MAX_SEQ_LENGTH = 100
GPT_HIDDEN_SIZE = 768  # hidden size of the base GPT-2 model
FILTER_SIZES = [3, 5, 7]
NUM_FILTERS = 256
GRU_UNITS = 256
DENSE_UNITS = 1
DROPOUT_RATE = 0.8  # fairly aggressive; applied to the GRU output below
print('config done')
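# Optional: seed the RNGs so runs are repeatable. A minimal sketch, not part
# of the original script; the seed value 42 is an arbitrary choice.
import random
import tensorflow as tf
random.seed(42)
np.random.seed(42)
tf.random.set_seed(42)
torch.manual_seed(42)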
# Load the dataset
df = pd.read_csv("/kaggle/input/sentiment140/training.1600000.processed.noemoticon.csv",
                 encoding='latin-1',
                 header=None)
df.columns = ["sentiment", "id", "date", "query", "user", "text"]
df = df[["sentiment", "text"]]
df["sentiment"] = df["sentiment"].replace({0: "negative", 4: "positive"})
texts = df["text"].values
labels = df["sentiment"].values
labels = np.array([1 if label == "positive" else 0 for label in labels])
print(df.head(10))
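# Optional: extracting GPT-2 features for all 1.6M tweets is very slow on a
# single GPU, so a stratified subsample is often used for prototyping. This
# is a sketch under that assumption; SAMPLE_PER_CLASS is a hypothetical
# setting, not from the original pipeline.
SUBSAMPLE = False
if SUBSAMPLE:
    SAMPLE_PER_CLASS = 25000
    df = df.groupby("sentiment", group_keys=False).apply(
        lambda g: g.sample(n=SAMPLE_PER_CLASS, random_state=42))
    texts = df["text"].values
    labels = np.array([1 if s == "positive" else 0
                       for s in df["sentiment"].values])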
# Preprocess text data: use frozen GPT-2 hidden states as pre-trained
# token embeddings for the Keras model below.
tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
gpt_model = GPT2Model.from_pretrained("gpt2").to(device)
gpt_model.eval()  # inference only; the GPT-2 weights stay frozen

def extract_gpt_features(text):
    inputs = tokenizer.encode_plus(text, add_special_tokens=True,
                                   truncation=True, max_length=MAX_SEQ_LENGTH,
                                   return_tensors="pt")
    inputs = inputs.to(device)
    with torch.no_grad():
        outputs = gpt_model(**inputs)[0]  # last hidden state: (1, seq_len, 768)
    # Return the full per-token sequence. The original sliced out only the
    # first token's state, which in a causal model sees just one token and
    # also collapses the sequence the Conv1D/GRU layers below expect.
    return outputs.squeeze(0).cpu().numpy()  # (seq_len, GPT_HIDDEN_SIZE)
# Extract features for every tweet and pad/truncate to a fixed length;
# dtype='float32' matters, since pad_sequences' int32 default would truncate the embeddings.
sequences = [extract_gpt_features(text) for text in texts]
data = pad_sequences(sequences, maxlen=MAX_SEQ_LENGTH, dtype='float32',
                     padding='post', truncating='post')
print('features done:', data.shape)
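# Optional speed-up: batch the GPT-2 forward passes instead of encoding one
# tweet at a time. A sketch assuming a batch size of 64 fits in GPU memory;
# GPT-2 has no pad token, so the EOS token is reused for padding.
def extract_gpt_features_batched(text_list, batch_size=64):
    tokenizer.pad_token = tokenizer.eos_token
    feats = []
    for i in range(0, len(text_list), batch_size):
        batch = list(text_list[i:i + batch_size])
        enc = tokenizer(batch, padding='max_length', truncation=True,
                        max_length=MAX_SEQ_LENGTH, return_tensors='pt').to(device)
        with torch.no_grad():
            out = gpt_model(**enc)[0]  # (batch, MAX_SEQ_LENGTH, 768)
        feats.append(out.cpu().numpy())
    return np.concatenate(feats, axis=0)
# data = extract_gpt_features_batched(texts)  # already padded; skip pad_sequences
# np.save('gpt2_features.npy', data)          # cache features to avoid recomputation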
# Define model architecture: parallel Conv1D branches over the GPT-2
# features, concatenated and fed to a GRU. The Embedding layer is gone (the
# inputs are already dense vectors), and padding='same' keeps all branches
# the same length so they can be concatenated; the original full-width
# pooling left the GRU only a single timestep to read.
inputs = Input(shape=(MAX_SEQ_LENGTH, GPT_HIDDEN_SIZE))
conv_layers = []
for filter_size in FILTER_SIZES:
    conv = Conv1D(filters=NUM_FILTERS, kernel_size=filter_size,
                  padding='same', activation='relu')(inputs)
    pool = MaxPooling1D(pool_size=2)(conv)
    conv_layers.append(pool)
concat = Concatenate()(conv_layers)  # (batch, MAX_SEQ_LENGTH // 2, 3 * NUM_FILTERS)
gru = GRU(units=GRU_UNITS)(concat)
dropout = Dropout(rate=DROPOUT_RATE)(gru)
outputs = Dense(units=DENSE_UNITS, activation='sigmoid')(dropout)
model = Model(inputs=inputs, outputs=outputs)
model.compile(optimizer=Adam(), loss='binary_crossentropy', metrics=['accuracy'])
model.summary()
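# Optional: render the parallel-branch structure to an image (requires the
# pydot and graphviz packages; a sketch, not part of the original pipeline).
# from tensorflow.keras.utils import plot_model
# plot_model(model, to_file='model.png', show_shapes=True)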
# Train the model with early stopping
es = EarlyStopping(monitor='val_accuracy', patience=5, mode='max', min_delta=0.01,
baseline=0.85)
history = model.fit(data, labels, epochs=50, validation_split=0.3, callbacks=[es])
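# Optional: persist the trained weights so inference can be rerun without
# retraining (a sketch; the filename is an arbitrary choice, not from the
# original script).
model.save('gpt2_cnn_gru_sentiment.h5')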
# Plot accuracy
plt.plot(history.history['accuracy'])
plt.plot(history.history['val_accuracy'])
plt.title('Model Accuracy')
plt.xlabel('Epoch')
plt.ylabel('Accuracy')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()
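# Plot loss alongside accuracy, mirroring the accuracy plot above.
plt.plot(history.history['loss'])
plt.plot(history.history['val_loss'])
plt.title('Model Loss')
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()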
# Make predictions on new data
new_texts = ["is upset that he can't update his Facebook by texting it... and might cry as a result School today ...",
             "@Kenichan I dived many times for the ball. Managed to save 50% The rest go out of bounds",
             "my whole body feels itchy and like its on fire",
             "@nationwideclass no, it's not behaving at all. i'm mad. why am i here? because I can't see you all o...",
             "@Kwesidei not the whole crew",
             "@LettyA ahh ive always wanted to see rent love the soundtrack!!",
             "@FakerPattyPattz Oh dear. Were you drinking out of the forgotten table drinks? "]
new_sequences = [extract_gpt_features(text) for text in new_texts]
new_data = pad_sequences(new_sequences, maxlen=MAX_SEQ_LENGTH, dtype='float32',
                         padding='post', truncating='post')
predictions = model.predict(new_data)
# Evaluate the model on the hand-labelled examples
y_pred = np.round(predictions).astype(int).ravel()
y_true = np.array([0, 0, 0, 0, 0, 0, 0])  # True labels of new data (all negative)
cm = confusion_matrix(y_true, y_pred, labels=[0, 1])  # force a 2x2 matrix even if one class is absent
print(cm)
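# Optional: print each tweet with its predicted label and score, which is
# easier to eyeball than the raw confusion matrix (a sketch, not in the
# original script).
for text, score in zip(new_texts, predictions.ravel()):
    label = 'positive' if score >= 0.5 else 'negative'
    print(f"{label} ({score:.3f}): {text[:60]}")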