smollm2 / train_smollm2.py
Vibi007's picture
first commit
035761e
raw
history blame contribute delete
420 Bytes
from transformers import AutoModelForCausalLM, AutoTokenizer, Trainer
# from datasets import load_dataset
# dataset = load_dataset("HuggingFaceTB/smollm-corpus", "cosmopedia-v2")
# use tokeniser https://huggingface.co/HuggingFaceTB/cosmo2-tokenizer
# tokenizer = AutoTokenizer.from_pretrained("HuggingFaceTB/cosmo2-tokenizer")
model = AutoModelForCausalLM.from_pretrained("HuggingFaceTB/SmolLM2-135M")
print(model)