Skip to content

Commit

Permalink
Hopefully can use weka for the train datasets now
Browse files (browse the repository at this point in the history)
  • Loading branch information
jakep-allenai committed Oct 7, 2024
1 parent d8e459c commit 44bcdc7
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 5 deletions.
8 changes: 4 additions & 4 deletions pdelfin/train/config/qwen2vl-7b-lora.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -29,11 +29,11 @@ train_data:
seed: 1337
sources:
- name: openai_batch_data_v5_1_train
query_glob_path: s3://ai2-oe-data/jakep/pdfdata/openai_batch_data_v5_1_train/*.jsonl
response_glob_path: s3://ai2-oe-data/jakep/pdfdata/openai_batch_data_v5_1_train_done/*.json
query_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_train/*.jsonl
response_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_train_done/*.json
- name: openai_batch_data_v5_1_train
query_glob_path: s3://ai2-oe-data/jakep/pdfdata/openai_batch_data_v5_1_iabooks_train/*.jsonl
response_glob_path: s3://ai2-oe-data/jakep/pdfdata/openai_batch_data_v5_1_iabooks_train_done/*.json
query_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_iabooks_train/*.jsonl
response_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_iabooks_train_done/*.json

valid_data:
metric_for_best_model: openai_batch_data_v5_1_eval_loss
Expand Down
3 changes: 2 additions & 1 deletion scripts/qwen2vl-7b-gantry.sh
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ run_name=$(basename "$0" .sh)
# --cluster 'ai2/allennlp-cirrascale' \
# --priority high \

CLUSTER='pluto'
CLUSTER='jupiter'

gantry run \
--description "${run_name}"\
Expand All @@ -35,6 +35,7 @@ gantry run \
--preemptible \
--cluster "ai2/${CLUSTER}*" \
--budget ai2/oe-data \
--weka "oe-data-default:/data" \
--env LOG_FILTER_TYPE=local_rank0_only \
--env OMP_NUM_THREADS=8 \
--env BEAKER_USER_ID=$(beaker account whoami --format json | jq '.[0].name' -cr) \
Expand Down

0 comments on commit 44bcdc7

Please sign in to comment.