unidisc / configs /experiments /unified.yaml
aswerdlow's picture
Initial commit
131da64
raw
history blame contribute delete
449 Bytes
# @package _global_
# Experiment overrides for the unified-model run.
# The `@package _global_` line above is a Hydra package directive and is kept
# as the first line of this config; with `_global_` the keys below are
# addressed from the config root rather than from this file's directory.

data:
  # Dataset identifier used for zero-shot evaluation.
  zero_shot_eval_dataset: "nlphuji/flickr30k"
  precache: false
  tokenizers_parallelism: false  # parallelism causes some weird error
  n_val_samples: 2048
  # NOTE(review): presumably the sequence length in tokens - confirm.
  block_size: 128

model:
  unified_model: true
  text_model: true

checkpointing:
  resume_from_ckpt: true
  # Path to a safetensors weights file.
  # NOTE(review): presumably a text-only checkpoint used for
  # initialisation - confirm against the loading code.
  load_from_text_model: "ckpts/unidisc-owt/model.safetensors"

loader:
  # NOTE(review): per-device vs. global batch size is not visible here.
  batch_size: 12

trainer:
  # NOTE(review): unit (steps vs. batches) depends on the trainer - confirm.
  val_check_interval: 2000
  # NOTE(review): "seperate" is misspelled, but this key has to match the
  # name the consuming code reads, so it must not be renamed in this file
  # alone.
  log_seperate_modal_losses: true