We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3748e8b commit 487085d Copy full SHA for 487085d
scripts/configs/qwen2/train_colqwen2_gradcache_model.yaml
@@ -30,7 +30,7 @@ config:
30
run_eval: true
31
loss_func:
32
(): colpali_engine.loss.gradcache_late_interaction_losses.GradCacheColbertPairwiseCELoss # GradCacheColbertLoss #
33
- mini_batch_size: 64
+ mini_batch_size: 32
34
tr_args:
35
(): transformers.training_args.TrainingArguments
36
output_dir: null
@@ -44,7 +44,7 @@ config:
44
# gradient_accumulation_steps: 4
45
per_device_eval_batch_size: 16
46
eval_strategy: "steps"
47
- dataloader_num_workers: 8 # 4
+ dataloader_num_workers: 4 # 4
48
# bf16: true
49
save_steps: 500
50
logging_steps: 10
0 commit comments