File size: 657 Bytes
4c70265
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
{
    "type": "hfmodel",
    "config": {
        "model_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
        "adapter_path": "/content/models/deepseek/en_ft/adapter",
        "task": "text-generation-with-past",
        "load_kwargs": {
            "torch_dtype": null,
            "device_map": null,
            "max_memory": null,
            "quantization_method": null,
            "quantization_config": null,
            "trust_remote_code": true,
            "extra_args": {
                "attn_implementation": "eager"
            }
        },
        "generative": true,
        "model_attributes": null,
        "io_config": null
    }
}