Spaces:
Paused
Paused
| TheBloke_Luna-AI-Llama2-Uncensored-GPTQ$: | |
| loader: ExLlama_HF | |
| cpu_memory: 58000 | |
| auto_devices: true | |
| disk: false | |
| cpu: false | |
| bf16: false | |
| load_in_8bit: false | |
| trust_remote_code: false | |
| load_in_4bit: false | |
| compute_dtype: float16 | |
| quant_type: nf4 | |
| use_double_quant: false | |
| wbits: '4' | |
| groupsize: '64' | |
| model_type: None | |
| pre_layer: 0 | |
| triton: false | |
| desc_act: false | |
| no_inject_fused_attention: false | |
| no_inject_fused_mlp: false | |
| no_use_cuda_fp16: false | |
| threads: 0 | |
| n_batch: 512 | |
| no_mmap: false | |
| low_vram: false | |
| mlock: false | |
| n_gpu_layers: 0 | |
| n_ctx: 2048 | |
| n_gqa: 0 | |
| rms_norm_eps: 0 | |
| llama_cpp_seed: 0.0 | |
| gpu_split: '' | |
| max_seq_len: 4096 | |
| compress_pos_emb: 1 | |
| alpha_value: 1 | |
| gpu_memory_0: 6990 | |