In [ ]:
# Transformer Model Training and Evaluation
# This notebook demonstrates how to train and evaluate a transformer model using the IMDb dataset.

import os
os.environ["WANDB_DISABLED"] = "true"  # Disable Weights and Biases logging

%pip install transformers datasets evaluate torch  # Install necessary packages

import torch
from transformers import AutoTokenizer, AutoModelForSequenceClassification, AutoConfig, Trainer, TrainingArguments
from datasets import load_dataset
import evaluate
import time
Load and Preprocess Data

We load the IMDb dataset and preprocess it by tokenizing the text data. We then define the model configuration, initialize the model, set the training arguments, and train the model.
In [ ]:
dataset = load_dataset("imdb") train_data = dataset["train"] test_data = dataset["test"] model_name = "bert-base-uncased" tokenizer = AutoTokenizer.from_pretrained(model_name) # Initialize the tokenizer config = AutoConfig.from_pretrained(model_name) # Load model configuration config.num_labels = 2 # Set the number of labels for classification model = AutoModelForSequenceClassification.from_config(config) # Initialize the model def preprocess_function(examples): # Tokenize the text data return tokenizer(examples["text"], padding="max_length", truncation=True) # Tokenize the training and test datasets tokenized_train = train_data.map(preprocess_function, batched=True) tokenized_test = test_data.map(preprocess_function, batched=True) accuracy_metric = evaluate.load("accuracy") # Load the accuracy metric def compute_metrics(eval_pred): # Compute evaluation metrics logits, labels = eval_pred predictions = torch.argmax(torch.tensor(logits), dim=1) return accuracy_metric.compute(predictions=predictions, references=labels) # Set training arguments training_args = TrainingArguments( output_dir="./results", evaluation_strategy="epoch", learning_rate=2e-5, per_device_train_batch_size=8, per_device_eval_batch_size=8, num_train_epochs=3, weight_decay=0.01, logging_dir='./logs', save_strategy="epoch", save_total_limit=1, ) # Initialize the Trainer trainer = Trainer( model=model, args=training_args, train_dataset=tokenized_train, eval_dataset=tokenized_test, tokenizer=tokenizer, compute_metrics=compute_metrics ) print("Training model...") start_time = time.time() trainer.train() # Train the model
In [ ]:
# Measure GPU memory usage after training
gpu_memory_after_training = torch.cuda.memory_allocated() / 1024**3 if torch.cuda.is_available() else None
if gpu_memory_after_training is not None:
    print(f"GPU Memory Usage After Training: {gpu_memory_after_training:.2f} GB")

end_time = time.time()
training_time = end_time - start_time
print(f"Training time: {training_time:.2f} seconds")

# Evaluate the model
print("Evaluating model...")
start_time = time.time()
results = trainer.evaluate()  # Evaluate the model on the test set

# Measure GPU memory usage after evaluation
gpu_memory_after_evaluation = torch.cuda.memory_allocated() / 1024**3 if torch.cuda.is_available() else None
if gpu_memory_after_evaluation is not None:
    print(f"GPU Memory Usage After Evaluation: {gpu_memory_after_evaluation:.2f} GB")

end_time = time.time()
inference_time = end_time - start_time
print(f"Inference time (evaluation on the test set): {inference_time:.2f} seconds")

print(results)

# Extract evaluation metrics. Only accuracy is produced by compute_metrics above, so precision,
# recall, F1, and ROC-AUC will be reported as "not found" unless compute_metrics is extended.
accuracy = results.get("eval_accuracy", None)
precision = results.get("eval_precision", None)
recall = results.get("eval_recall", None)
f1_score = results.get("eval_f1", None)
roc_auc = results.get("eval_roc_auc", None)

# Display the metrics
print(f"Accuracy: {accuracy:.4f}" if accuracy is not None else "Accuracy metric not found.")
print(f"Precision: {precision:.4f}" if precision is not None else "Precision metric not found.")
print(f"Recall: {recall:.4f}" if recall is not None else "Recall metric not found.")
print(f"F1-Score: {f1_score:.4f}" if f1_score is not None else "F1-Score metric not found.")
print(f"ROC-AUC: {roc_auc:.4f}" if roc_auc is not None else "ROC-AUC metric not found.")

# Display GPU memory usage (captured at the measurement points above)
if gpu_memory_after_training is not None:
    print(f"GPU Memory Usage After Training: {gpu_memory_after_training:.2f} GB")
if gpu_memory_after_evaluation is not None:
    print(f"GPU Memory Usage After Evaluation: {gpu_memory_after_evaluation:.2f} GB")
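After training and evaluation, a quick sanity check is to run the fine-tuned model on a single review outside the Trainer. This is a minimal sketch, assuming the model and tokenizer defined above are still in memory; sample_text is an arbitrary illustrative string, and for the IMDb labels 0 corresponds to negative and 1 to positive.

In [ ]:
# Sketch: single-example inference with the fine-tuned model (illustrative, not part of the original run).
sample_text = "A surprisingly moving film with a terrific lead performance."
device = "cuda" if torch.cuda.is_available() else "cpu"
model.to(device)
model.eval()

inputs = tokenizer(sample_text, truncation=True, return_tensors="pt").to(device)
with torch.no_grad():
    logits = model(**inputs).logits
predicted_label = torch.argmax(logits, dim=1).item()
print(f"Predicted label: {predicted_label} ({'positive' if predicted_label == 1 else 'negative'})")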