Wesleythu committed on
Commit
6563ff4
·
verified ·
1 Parent(s): db9ea62

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -2
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  license: apache-2.0
3
  base_model:
4
- - meta-llama/Meta-Llama-3-8B
5
  library_name: transformers
6
  tags:
7
  - reward-model
@@ -41,7 +41,7 @@ WildReward is trained using **ordinal regression** (CORAL-like approach) on the
41
  import torch
42
  from transformers import AutoTokenizer, AutoModelForSequenceClassification
43
 
44
- model_name = "yourusername/WildReward-Llama3-8B"
45
  tokenizer = AutoTokenizer.from_pretrained(model_name)
46
  model = AutoModelForSequenceClassification.from_pretrained(model_name)
47
 
 
1
  ---
2
  license: apache-2.0
3
  base_model:
4
+ - Qwen/Qwen3-8B
5
  library_name: transformers
6
  tags:
7
  - reward-model
 
41
  import torch
42
  from transformers import AutoTokenizer, AutoModelForSequenceClassification
43
 
44
+ model_name = "THU-KEG/WildReward-8B"
45
  tokenizer = AutoTokenizer.from_pretrained(model_name)
46
  model = AutoModelForSequenceClassification.from_pretrained(model_name)
47