Update device
modeling_custom.py +2 -2
```diff
@@ -140,11 +140,11 @@ class LlamaForRewardModelWithGating(LlamaPreTrainedModel):
             # if no pad token found, use modulo instead of reverse indexing for ONNX compatibility
             sequence_lengths = torch.eq(input_ids, self.config.pad_token_id).int().argmax(-1) - 1
             sequence_lengths = sequence_lengths % input_ids.shape[-1]
-            sequence_lengths = sequence_lengths.to(
+            sequence_lengths = sequence_lengths.to("cuda")
         else:
             sequence_lengths = -1
 
-        dummy_iterator = torch.arange(batch_size, device=
+        dummy_iterator = torch.arange(batch_size, device="cuda")
         hidden_states = tokens_hidden_states[dummy_iterator, sequence_lengths]
         assert hidden_states.shape == (batch_size, self.config.hidden_size)
         rewards = self.regression_layer(hidden_states)
```
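For context, the two edited lines sit in the last-token pooling step of the reward head: the model locates the last non-pad token in each sequence (first pad position minus one, with a modulo so the index stays valid when a row has no padding, which keeps the graph ONNX-exportable), gathers that token's hidden state, and passes it to the regression layer. The following is a minimal, self-contained sketch of that logic, not the repository's forward pass; the pad token id, shapes, and inputs are illustrative assumptions, and the device is taken from the hidden-states tensor rather than hardcoded to "cuda" so the sketch also runs on CPU.

```python
import torch

# Minimal sketch of the last-token pooling shown in the diff; pad_token_id,
# shapes, and example inputs are illustrative assumptions.
pad_token_id = 0
batch_size, seq_len, hidden_size = 2, 6, 4

input_ids = torch.tensor([
    [5, 7, 9, pad_token_id, pad_token_id, pad_token_id],  # padded row
    [3, 4, 6, 8, 2, 1],                                    # no padding in this row
])
tokens_hidden_states = torch.randn(batch_size, seq_len, hidden_size)

# First pad position minus one = index of the last real token; the modulo
# wraps the -1 produced by an unpadded row back to the final position,
# avoiding reverse indexing (the ONNX-compatibility trick noted in the diff).
sequence_lengths = torch.eq(input_ids, pad_token_id).int().argmax(-1) - 1
sequence_lengths = sequence_lengths % input_ids.shape[-1]

# The commit pins both tensors to "cuda"; this sketch follows the hidden
# states' device instead so it also runs on a CPU-only machine.
device = tokens_hidden_states.device
sequence_lengths = sequence_lengths.to(device)
dummy_iterator = torch.arange(batch_size, device=device)

# Gather one hidden state per sequence and score it.
hidden_states = tokens_hidden_states[dummy_iterator, sequence_lengths]
assert hidden_states.shape == (batch_size, hidden_size)

regression_layer = torch.nn.Linear(hidden_size, 1)  # stand-in for self.regression_layer
rewards = regression_layer(hidden_states)
print(sequence_lengths.tolist())  # [2, 5]
print(rewards.shape)              # torch.Size([2, 1])
```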