File tree Expand file tree Collapse file tree
examples/finetune/embedder Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -309,7 +309,7 @@ torchrun --nproc_per_node 2 \
309309 ./example_data/clustering-no_in_batch_neg \
310310 --cache_path ./cache/data \
311311 --train_group_size 8 \
312- --query_max_len 512 \
312+ --query_max_len 2048 \
313313 --passage_max_len 512 \
314314 --pad_to_multiple_of 8 \
315315 --query_instruction_for_retrieval ' Given a query, retrieve passages that are relevant to the query.' \
@@ -318,8 +318,8 @@ torchrun --nproc_per_node 2 \
318318 --same_dataset_within_batch True \
319319 --small_threshold 0 \
320320 --drop_threshold 0 \
321- --example_query_max_len 64 \
322- --example_passage_max_len 96 \
321+ --example_query_max_len 256 \
322+ --example_passage_max_len 256 \
323323 --retrieval_use_examples True \
324324 --icl_suffix_str ' \n<response>' \
325325 --output_dir ./test_decoder_only_base_bge-en-icl_sd \
Original file line number Diff line number Diff line change @@ -32,7 +32,7 @@ data_args="\
3232 --train_data $train_data \
3333 --cache_path ~/.cache \
3434 --train_group_size 8 \
35- --query_max_len 512 \
35+ --query_max_len 2048 \
3636 --passage_max_len 512 \
3737 --pad_to_multiple_of 8 \
3838 --query_instruction_for_retrieval 'Given a query, retrieve passages that are relevant to the query.' \
@@ -41,8 +41,8 @@ data_args="\
4141 --same_dataset_within_batch True \
4242 --small_threshold 0 \
4343 --drop_threshold 0 \
44- --example_query_max_len 64 \
45- --example_passage_max_len 96 \
44+ --example_query_max_len 256 \
45+ --example_passage_max_len 256 \
4646 --retrieval_use_examples True \
4747 --icl_suffix_str '\n<response>' \
4848"
Original file line number Diff line number Diff line change 2323 'deepspeed' ,
2424 'flash-attn==2.5.6' ,
2525 'ir-datasets' ,
26- 'sentencepiece'
26+ 'sentencepiece' ,
27+ 'protobuf'
2728 ],
2829)
You can’t perform that action at this time.
0 commit comments