Update README.md
Browse files
README.md
CHANGED
|
@@ -106,7 +106,10 @@ output_text = tokenizer.decode(output_id[0][input_ids.shape[1] :])
|
|
| 106 |
print(output_text)
|
| 107 |
```
|
| 108 |
|
| 109 |
-
##
|
|
|
|
|
|
|
|
|
|
| 110 |
```bash
|
| 111 |
curl -X POST http://localhost:8000/v1/chat/completions \
|
| 112 |
-H "Content-Type: application/json" \
|
|
@@ -123,11 +126,6 @@ curl -X POST http://localhost:8000/v1/chat/completions \
|
|
| 123 |
}'
|
| 124 |
```
|
| 125 |
|
| 126 |
-
## VLLM Inference
|
| 127 |
-
```py
|
| 128 |
-
vllm serve Writer/palmyra-mini-thinking-a
|
| 129 |
-
```
|
| 130 |
-
|
| 131 |
|
| 132 |
## Ethical Considerations
|
| 133 |
|
|
|
|
| 106 |
print(output_text)
|
| 107 |
```
|
| 108 |
|
| 109 |
+
## Running with vLLM
|
| 110 |
+
```bash
|
| 111 |
+
vllm serve Writer/palmyra-mini-thinking-a
|
| 112 |
+
```
|
| 113 |
```bash
|
| 114 |
curl -X POST http://localhost:8000/v1/chat/completions \
|
| 115 |
-H "Content-Type: application/json" \
|
|
|
|
| 126 |
}'
|
| 127 |
```
|
| 128 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 129 |
|
| 130 |
## Ethical Considerations
|
| 131 |
|