Martins Kronis commited on
Commit
e4c6ad4
·
1 Parent(s): 695086a

update code snippets

Browse files
Files changed (1) hide show
  1. README.md +11 -1
README.md CHANGED
@@ -93,6 +93,7 @@ We follow [Deespeek v3](https://arxiv.org/pdf/2412.19437) and slightly overscale
93
  ## Running model using HF ```transformers >= 5```
94
 
95
  ```python
 
96
  from transformers import AutoTokenizer, AutoModelForCausalLM
97
 
98
  # Load tokenizer + model
@@ -113,6 +114,8 @@ outputs = model.generate(
113
  repetition_penalty=1.2,
114
  do_sample=False,
115
  )
 
 
116
  ```
117
 
118
  ## Running model using (old) HF ```transformers < 5```
@@ -123,6 +126,7 @@ We suggest avoiding patches and using transformers >= 5 or vLLM.
123
 
124
 
125
  ```python
 
126
  from transformers import AutoTokenizer, AutoModelForCausalLM
127
 
128
  # Load tokenizer + model
@@ -135,7 +139,11 @@ model = AutoModelForCausalLM.from_pretrained(
135
  )
136
 
137
  # Tokenize
138
- inputs = tokenizer(user_in, return_tensors="pt").to(model.device)
 
 
 
 
139
 
140
  # Generate (greedy, deterministic)
141
  outputs = model.generate(
@@ -144,6 +152,8 @@ outputs = model.generate(
144
  repetition_penalty=1.2,
145
  do_sample=False,
146
  )
 
 
147
  ```
148
 
149
  # Evaluation
 
93
  ## Running model using HF ```transformers >= 5```
94
 
95
  ```python
96
+ import torch
97
  from transformers import AutoTokenizer, AutoModelForCausalLM
98
 
99
  # Load tokenizer + model
 
114
  repetition_penalty=1.2,
115
  do_sample=False,
116
  )
117
+
118
+ text = tokenizer.decode(outputs[0], skip_special_tokens=True)
119
  ```
120
 
121
  ## Running model using (old) HF ```transformers < 5```
 
126
 
127
 
128
  ```python
129
+ import torch
130
  from transformers import AutoTokenizer, AutoModelForCausalLM
131
 
132
  # Load tokenizer + model
 
139
  )
140
 
141
  # Tokenize
142
+ inputs = tokenizer(
143
+ user_in,
144
+ return_tensors="pt",
145
+ return_token_type_ids=False, # sometimes needed for older transformers
146
+ ).to(model.device)
147
 
148
  # Generate (greedy, deterministic)
149
  outputs = model.generate(
 
152
  repetition_penalty=1.2,
153
  do_sample=False,
154
  )
155
+
156
+ text = tokenizer.decode(outputs[0], skip_special_tokens=True)
157
  ```
158
 
159
  # Evaluation