File tree (expand / collapse): 2 files changed, +2 -2 lines changed
src/fairseq2/recipes/lm/_online_finetune (expand / collapse file tree): 2 files changed, +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -194,7 +194,7 @@ def validate_reward(
194194 ) in self ._config .loss_config .validation_vllm_sampling_params .items ():
195195 policy_sampling_params .__setattr__ (k , v )
196196
197- # For a pairwise RM, need to sample at least two judgments
197+ # For a pairwise RM, need to sample at least two rollouts
198198 policy_sampling_params .n = (
199199 2 if self ._reward .reward_name == "generative_pairwise_verifier" else 1
200200 )
Original file line number | Diff line number | Diff line change
@@ -140,7 +140,7 @@ def validate_reward(
140140 ) in self ._config .loss_config .validation_vllm_sampling_params .items ():
141141 policy_sampling_params .__setattr__ (k , v )
142142
143- # For a pairwise RM, need to sample at least two judgments
143+ # For a pairwise RM, need to sample at least two rollouts
144144 policy_sampling_params .n = (
145145 2 if self ._reward .reward_name == "generative_pairwise_verifier" else 1
146146 )
You can’t perform that action at this time.
0 commit comments