Skip to content

Commit

Permalink
feat(components): Update policy to reward model name mapping in function based component in _implementation/llm
Browse files Browse the repository at this point in the history

PiperOrigin-RevId: 560479276
  • Loading branch information
Googler committed Aug 27, 2023
1 parent 63a0803 commit 110e082
Showing 1 changed file with 4 additions and 4 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -294,15 +294,15 @@ def resolve_reference_model_metadata(
'llama-2-7b-chat': reference_model_metadata(
large_model_reference='LLAMA_2_7B_CHAT',
reference_model_path='gs://vertex-rlhf-restricted/pretrained_models/llama/t5x_llama_2_7b_chat/',
- reward_model_reference='LLAMA_2_7B_CHAT',
- reward_model_path='gs://vertex-rlhf-restricted/pretrained_models/llama/t5x_llama_2_7b_chat/',
+ reward_model_reference='LLAMA_2_7B',
+ reward_model_path='gs://vertex-rlhf-restricted/pretrained_models/llama/t5x_llama_2_7b/',
is_supported=True,
),
'llama-2-13b-chat': reference_model_metadata(
large_model_reference='LLAMA_2_13B_CHAT',
reference_model_path='gs://vertex-rlhf-restricted/pretrained_models/llama/t5x_llama_2_13b_chat/',
- reward_model_reference='LLAMA_2_13B_CHAT',
- reward_model_path='gs://vertex-rlhf-restricted/pretrained_models/llama/t5x_llama_2_13b_chat/',
+ reward_model_reference='LLAMA_2_13B',
+ reward_model_path='gs://vertex-rlhf-restricted/pretrained_models/llama/t5x_llama_2_13b/',
is_supported=True,
),
}
Expand Down

0 comments on commit 110e082

Please sign in to comment.