# Here is the command-line style inference code.
# Runs `swift infer` with CUDA_VISIBLE_DEVICES=0 set for this one command only.
# NOTE: output/vx-xxx/checkpoint-xxx is a placeholder path; substitute the
# actual checkpoint directory before running.
# Each `\` must be the very last character on its line so the command continues.
CUDA_VISIBLE_DEVICES=0 \
swift infer \
    --adapters output/vx-xxx/checkpoint-xxx \
    --stream true \
    --temperature 0 \
    --max_new_tokens 2048
# Here is the command-line style inference code.
# Runs `swift infer` with CUDA_VISIBLE_DEVICES=0 set for this one command only.
# NOTE: output/vx-xxx/checkpoint-xxx is a placeholder path; substitute the
# actual checkpoint directory before running.
# Each `\` must be the very last character on its line so the command continues.
CUDA_VISIBLE_DEVICES=0 \
swift infer \
    --adapters output/vx-xxx/checkpoint-xxx \
    --stream true \
    --temperature 0 \
    --max_new_tokens 2048