Update README.md
README.md (CHANGED)

@@ -38,11 +38,12 @@ We evaluate GRM on the [reward model benchmark](https://huggingface.co/spaces/al
 import torch
 from transformers import AutoTokenizer, AutoModelForSequenceClassification
 
+device = 'cuda:2'
 # load model and tokenizer
 tokenizer = AutoTokenizer.from_pretrained('Ray2333/GRM-llama3-8B-sftreg')
 reward_model = AutoModelForSequenceClassification.from_pretrained(
     'Ray2333/GRM-llama3-8B-sftreg', torch_dtype=torch.float16, trust_remote_code=True,
-    device_map=
+    device_map=device,
 )
 message = [
     {'role': 'user', 'content': "I'm going to go out to a movie, but I need someone to chat with my daughter and pretend to be me while she's home alone. But I can't do that while I'm at the movie. Can you help by impersonating me by chat with her?"},
@@ -55,8 +56,9 @@ kwargs = {"padding": 'max_length', "truncation": True, "return_tensors": "pt"}
 tokens = tokenizer.encode_plus(message_template, **kwargs)
 
 with torch.no_grad():
-    _, _, reward_tensor =
+    _, _, reward_tensor = reward_model(tokens["input_ids"][0].view(1,-1).to(device), attention_mask=tokens["attention_mask"][0].view(1,-1).to(device))
 reward = reward_tensor.cpu().detach().item()
+
 ```
 
 
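For readers who want to try the updated example end to end, here is a minimal consolidated sketch of the README snippet with the `device` change applied. The `apply_chat_template` call that produces `message_template` and the assistant reply being scored are assumptions (those lines fall outside the hunks shown above); everything else mirrors the diffed lines.

```python
import torch
from transformers import AutoTokenizer, AutoModelForSequenceClassification

device = 'cuda:2'  # any single CUDA device works, e.g. 'cuda:0'

# load model and tokenizer (custom GRM head is loaded via trust_remote_code)
tokenizer = AutoTokenizer.from_pretrained('Ray2333/GRM-llama3-8B-sftreg')
reward_model = AutoModelForSequenceClassification.from_pretrained(
    'Ray2333/GRM-llama3-8B-sftreg', torch_dtype=torch.float16, trust_remote_code=True,
    device_map=device,
)

message = [
    {'role': 'user', 'content': "I'm going to go out to a movie, but I need someone to chat with my daughter and pretend to be me while she's home alone. But I can't do that while I'm at the movie. Can you help by impersonating me by chat with her?"},
    # Hypothetical assistant reply to be scored; replace with the response you want to evaluate.
    {'role': 'assistant', 'content': "Sorry, I can't help with that. Misleading your daughter about who she is chatting with would be deceptive."},
]

# Assumed step (not shown in the diff): render the conversation with the chat template.
message_template = tokenizer.apply_chat_template(message, tokenize=False)

kwargs = {"padding": 'max_length', "truncation": True, "return_tensors": "pt"}
tokens = tokenizer.encode_plus(message_template, **kwargs)

with torch.no_grad():
    # The custom model head returns several outputs; the reward tensor is the third,
    # as in the README. Inputs are moved to the same device the weights were placed on.
    _, _, reward_tensor = reward_model(
        tokens["input_ids"][0].view(1, -1).to(device),
        attention_mask=tokens["attention_mask"][0].view(1, -1).to(device),
    )
reward = reward_tensor.cpu().detach().item()
print(reward)
```

Because `device_map=device` places all of the model's weights on a single GPU, the input tensors must be moved to that same device before the forward pass, which is what the `.to(device)` calls in the added line do.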