Update README.md
README.md CHANGED

@@ -38,13 +38,13 @@ dtype: bfloat16
 
 ## 💻 Usage
 
 ```python
-!pip install -qU transformers accelerate
+!pip install -qU transformers accelerate einops
 
 from transformers import AutoTokenizer
 import transformers
 import torch
 
-model = "Isotonic/ohmistral-7b-
+model = "Isotonic/ohmistral-7b-5.1"
 messages = [{"role": "user", "content": "What is a large language model?"}]
 
 tokenizer = AutoTokenizer.from_pretrained(model)
@@ -54,8 +54,9 @@ pipeline = transformers.pipeline(
     model=model,
     torch_dtype=torch.float16,
     device_map="auto",
+    trust_remote_code=True,
 )
 
-outputs = pipeline(prompt, max_new_tokens=256, do_sample=True, temperature=0.
+outputs = pipeline(prompt, max_new_tokens=256, do_sample=True, temperature=0.8, top_k=80, top_p=0.95)
 print(outputs[0]["generated_text"])
 ```
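For context, here is what the updated snippet might look like when run end to end. The lines between the two hunks are not shown in the diff, so the `apply_chat_template` call that builds `prompt` and the `"text-generation"` task passed to `transformers.pipeline` below are assumptions filled in for illustration, not taken verbatim from the README.

```python
# Hedged sketch of the updated usage section, assembled from the diff above.
# The prompt-building step and the pipeline constructor's first argument are
# assumptions: they fall in the lines the diff does not show.
!pip install -qU transformers accelerate einops

from transformers import AutoTokenizer
import transformers
import torch

model = "Isotonic/ohmistral-7b-5.1"
messages = [{"role": "user", "content": "What is a large language model?"}]

tokenizer = AutoTokenizer.from_pretrained(model)
# Assumed: render the chat messages into a single prompt string.
prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
pipeline = transformers.pipeline(
    "text-generation",  # assumed task; the diff only shows the keyword arguments
    model=model,
    torch_dtype=torch.float16,
    device_map="auto",
    trust_remote_code=True,
)

outputs = pipeline(prompt, max_new_tokens=256, do_sample=True, temperature=0.8, top_k=80, top_p=0.95)
print(outputs[0]["generated_text"])
```

Note that `trust_remote_code=True` only has an effect if the repository ships custom modeling code; for a stock checkpoint it is a no-op.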