fix grpo id bug
This commit is contained in:
@@ -3,8 +3,8 @@ export DATA_DIR='data/nq_search'
|
||||
|
||||
WAND_PROJECT='Search-R1'
|
||||
|
||||
export BASE_MODEL='meta-llama/Llama-3.2-3B'
|
||||
export EXPERIMENT_NAME=nq-search-r1-grpo-llama3.2-3b-em
|
||||
# export BASE_MODEL='meta-llama/Llama-3.2-3B'
|
||||
# export EXPERIMENT_NAME=nq-search-r1-grpo-llama3.2-3b-em
|
||||
# export BASE_MODEL='meta-llama/Llama-3.2-3B-Instruct'
|
||||
# export EXPERIMENT_NAME=nq-search-r1-grpo-llama3.2-3b-it-em
|
||||
# export BASE_MODEL='meta-llama/Llama-3.1-8B'
|
||||
@@ -12,8 +12,8 @@ export EXPERIMENT_NAME=nq-search-r1-grpo-llama3.2-3b-em
|
||||
# export BASE_MODEL='meta-llama/Llama-3.1-8B-Instruct'
|
||||
# export EXPERIMENT_NAME=nq-search-r1-grpo-llama3.1-8b-it-em
|
||||
|
||||
# export BASE_MODEL='Qwen/Qwen2.5-3B'
|
||||
# export EXPERIMENT_NAME=nq-search-r1-grpo-qwen2.5-3b-em
|
||||
export BASE_MODEL='Qwen/Qwen2.5-3B'
|
||||
export EXPERIMENT_NAME=nq-search-r1-grpo-qwen2.5-3b-em
|
||||
# export BASE_MODEL='Qwen/Qwen2.5-3B-Instruct'
|
||||
# export EXPERIMENT_NAME=nq-search-r1-grpo-qwen2.5-3b-it-em
|
||||
# export BASE_MODEL='Qwen/Qwen2.5-7B'
|
||||
|
||||
Reference in New Issue
Block a user