Skip to content

Instantly share code, notes, and snippets.

@NohTow
NohTow / train-gte-moderncolbert.py
Last active May 24, 2025 07:20
GTE-ModernColBERT training boilerplate
from datasets import load_dataset
from sentence_transformers import (
SentenceTransformerTrainer,
SentenceTransformerTrainingArguments,
)
from pylate import evaluation, losses, models, utils
# Load the datasets required for knowledge distillation (train, queries, documents)
train = load_dataset(
import os
import torch
import torch.distributed as dist
import lovely_tensors as lt; lt.monkey_patch()
def split_tensor(data: torch.Tensor, dim: int) -> torch.Tensor:
rank = dist.get_rank()
world_size = dist.get_world_size()