Rename modeling_custom_old.py to modeling_custom.py
Browse files
modeling_custom_old.py → modeling_custom.py
RENAMED
@@ -173,7 +173,7 @@ class LlamaForRewardModelWithGating(LlamaForSequenceClassification):
|
|
173 |
torch.transpose(reward_quantiles_all_adjusted, 1, 2)
|
174 |
).sum(1)
|
175 |
|
176 |
-
|
177 |
|
178 |
rewards_expectation_adjusted = rewards_expectation @ self.reward_transform_matrix
|
179 |
score = torch.sum(gating_output * rewards_expectation_adjusted, dim=1, keepdim=True)
|
|
|
173 |
torch.transpose(reward_quantiles_all_adjusted, 1, 2)
|
174 |
).sum(1)
|
175 |
|
176 |
+
rewards_expectation = rewards.float().mean(dim=2)
|
177 |
|
178 |
rewards_expectation_adjusted = rewards_expectation @ self.reward_transform_matrix
|
179 |
score = torch.sum(gating_output * rewards_expectation_adjusted, dim=1, keepdim=True)
|