ModernBERT is an encoder-only transformer model for natural language understanding. In this notebook, we demonstrate several tasks it can perform out of the box, without any fine-tuning: masked language modeling, feature extraction, sentence similarity, and next-word prediction (via fill-mask).
Install Dependencies¶
!uv pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu126
!uv pip install git+https://github.com/huggingface/transformers.git
!uv pip install scikit-learn
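If an older transformers release is already present in the environment, a quick sanity check (a minimal sketch, not part of the original notebook) can confirm that the installed build knows about ModernBERT before running the pipelines below:
import transformers

# Quick sanity check: ModernBERT requires a recent transformers build
# (support landed around v4.48; the git install above satisfies this).
print("transformers version:", transformers.__version__)
print("ModernBERT available:", hasattr(transformers, "ModernBertModel"))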
Masked Language Modeling (Fill-Mask Task)¶
from transformers import pipeline
# Initialize the fill-mask pipeline
fill_mask = pipeline(
    task="fill-mask",
    model="answerdotai/ModernBERT-base",
    tokenizer="answerdotai/ModernBERT-base"
)
# Example masked text
masked_text = "The capital of France is [MASK]."
# Get predictions for the masked token
predictions = fill_mask(masked_text)
# Display predictions
print("Masked Text:", masked_text)
print("Predictions:")
for pred in predictions:
    print(f" - {pred['sequence']} (score: {pred['score']:.4f})")
Device set to use cuda:0
Masked Text: The capital of France is [MASK].
Predictions:
 - The capital of France is Paris. (score: 0.9233)
 - The capital of France is Lyon. (score: 0.0359)
 - The capital of France is Nancy. (score: 0.0231)
 - The capital of France is Nice. (score: 0.0062)
 - The capital of France is Orleans. (score: 0.0026)
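By default the pipeline returns its top five candidates. The fill-mask pipeline also accepts a top_k argument to widen or narrow that list; the sketch below reuses the fill_mask pipeline defined above.
# Ask for the ten highest-scoring fillers instead of the default five
top_predictions = fill_mask("The capital of France is [MASK].", top_k=10)
for pred in top_predictions:
    print(f" - {pred['token_str']} (score: {pred['score']:.4f})")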
Feature Extraction¶
from transformers import pipeline
# Initialize the feature extraction pipeline
feature_extractor = pipeline(
    task="feature-extraction",
    model="answerdotai/ModernBERT-base",
    tokenizer="answerdotai/ModernBERT-base"
)
# Example text
text = "ModernBERT is a robust model for natural language understanding."
# Extract features
features = feature_extractor(text)
# Display feature dimensions
print(f"Extracted feature shape: {len(features)} x {len(features[0])}")
Device set to use cuda:0
Extracted feature shape: 1 x 14
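The printed shape is batch x tokens; each of the 14 token positions also carries a full hidden-state vector. The short sketch below (assuming numpy is available; the hidden size is whatever the checkpoint uses, expected to be 768 for ModernBERT-base) inspects the complete shape and derives a single sentence-level vector by mean pooling.
import numpy as np

# features is a nested list shaped [batch, tokens, hidden_size]
token_embeddings = np.array(features[0])
print(f"Tokens x hidden size: {token_embeddings.shape}")

# Mean pooling over the token axis gives one fixed-size vector per input
sentence_embedding = token_embeddings.mean(axis=0)
print(f"Sentence embedding dimension: {sentence_embedding.shape[0]}")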
Sentence Similarity¶
from transformers import pipeline
from sklearn.metrics.pairwise import cosine_similarity
# Initialize the feature extraction pipeline
feature_extractor = pipeline(
    task="feature-extraction",
    model="answerdotai/ModernBERT-base",
    tokenizer="answerdotai/ModernBERT-base"
)
# Example sentences
sentence_1 = "ModernBERT is a great language model."
sentence_2 = "ModernBERT excels in understanding language."
# Extract embeddings (first-token representation of each sentence)
embedding_1 = feature_extractor(sentence_1)[0][0]
embedding_2 = feature_extractor(sentence_2)[0][0]
# Compute cosine similarity
similarity = cosine_similarity([embedding_1], [embedding_2])
print(f"Similarity between sentences: {similarity[0][0]:.4f}")
Device set to use cuda:0
Similarity between sentences: 0.9572
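The similarity above is computed from the first token's embedding only. Averaging all token embeddings (mean pooling) is a common alternative that often gives a more stable sentence representation; the sketch below reuses the feature_extractor pipeline and the two example sentences.
import numpy as np

def mean_pooled_embedding(text):
    # Average the embeddings of all tokens instead of taking only the first one
    token_embeddings = np.array(feature_extractor(text)[0])
    return token_embeddings.mean(axis=0)

pooled_1 = mean_pooled_embedding(sentence_1)
pooled_2 = mean_pooled_embedding(sentence_2)
pooled_similarity = cosine_similarity([pooled_1], [pooled_2])
print(f"Mean-pooled similarity: {pooled_similarity[0][0]:.4f}")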
Next-Word Prediction (Using Fill-Mask for Continuation)¶
from transformers import pipeline
# Initialize the fill-mask pipeline
fill_mask = pipeline(
    task="fill-mask",
    model="answerdotai/ModernBERT-base",
    tokenizer="answerdotai/ModernBERT-base"
)
# Example text with a masked token at the end
masked_text = "ModernBERT is designed for [MASK]."
# Get predictions
predictions = fill_mask(masked_text)
# Display next-word predictions
print("Masked Text:", masked_text)
print("Next Word Predictions:")
for pred in predictions:
    print(f" - {pred['sequence']} (score: {pred['score']:.4f})")
Device set to use cuda:0
Masked Text: ModernBERT is designed for [MASK].
Next Word Predictions:
 - ModernBERT is designed for you. (score: 0.1343)
 - ModernBERT is designed for men. (score: 0.0817)
 - ModernBERT is designed for women. (score: 0.0586)
 - ModernBERT is designed for professionals. (score: 0.0557)
 - ModernBERT is designed for adults. (score: 0.0540)
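When the set of plausible continuations is known in advance, the fill-mask pipeline's targets argument restricts scoring to those candidates (words that are not a single token in the vocabulary may be truncated to their first sub-token, with a warning). A minimal sketch, using hypothetical candidate words:
# Score only a fixed list of candidate continuations for the masked position
candidates = ["understanding", "classification", "retrieval"]
targeted_predictions = fill_mask("ModernBERT is designed for [MASK].", targets=candidates)
for pred in targeted_predictions:
    print(f" - {pred['token_str']} (score: {pred['score']:.4f})")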