Files
Catlin/config.py
2025-06-30 18:08:11 -04:00

12 lines
234 B
Python

# config.py
#
# Central place for the project's tunable constants. Everything here is a
# plain module-level value; the code that consumes these settings is not
# visible from this file, so descriptions based only on a name are hedged.

# --- Model shape -----------------------------------------------------------
# NOTE(review): presumably the tokenizer vocabulary size and the context
# window length in tokens -- confirm against the model/tokenizer code.
VOCAB_SIZE: int = 50_000
CONTEXT_SIZE: int = 128

# NOTE(review): names suggest a multi-head attention stack. 256 is evenly
# divisible by 8; keep it that way if the model splits EMBED_DIM per head.
EMBED_DIM: int = 256
NUM_HEADS: int = 8
NUM_LAYERS: int = 6

# --- Optimisation ----------------------------------------------------------
BATCH_SIZE: int = 16
LEARNING_RATE: float = 3e-4

# --- Runtime ---------------------------------------------------------------
# Requested device string; the fallback is handled in the trainer.
DEVICE: str = "cuda"

# --- Data ------------------------------------------------------------------
# Used to cap input corpus size.
MAX_TOKENS: int = 500_000