baseten/mistral_i1600_o600_bs96_fp16_tp1_lora_triton_tllm_bck_566b4ff3
Updated
baseten/mistral_i1600_o600_bs96_fp16_tp1_lora_tllm_0.11.0.566b4ff3
Updated
baseten/mistral_i1600_o600_bs32_fp16_tp2_lora_tllm_0.11.0.dev2024052100
Updated
baseten/mistral_i1600_o600_bs96_fp16_tp1_lora_tllm_0.11.0.dev2024052100
Updated
baseten/mistral_i1500_o500_bs8_fp16_tp1_tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b-instruct_fp8_tp4_i4096_o1024_bs40_fmha-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b-instruct_fp8_tp4_i4096_o1024_bs40-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b-instruct_fp8_tp2_i4096_o1024_bs64-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b-instruct_fp8_tp2_i4096_o1024_bs30_fmha_fmha-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b-instruct_fp8_tp2_i4096_o1024_bs32_fmha_fmha-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b_fp8_tp2_i4096_o1024_bs30_fmha-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b_fp8_tp2_i4096_o1024_bs48_fmha-tllm_0.11.0.dev2024052100
Updated
baseten/llama3-70b_fp8_tp2_i4096_o1024_bs64_max_tokens_49000-tllm_0.9.0.dev2024040200
Updated
baseten/llama3-70b_int8_tp2_i4096_o1024_bs32_fmha-tllm_0.9.0.dev2024040200
Updated
baseten/llama3-70b_fp8_tp2_i4096_o1024_bs64-tllm_0.9.0.dev2024040200
Updated
baseten/llama3-70b_fp8_tp2_i4096_o1024_bs64_fmha_max_tokens_49000-tllm_0.9.0.dev2024040200
Updated
baseten/llama-7b_fp16_tp1_i8000_o2000_bs30_FANCY-tllm_0.9.0.dev2024040200
Updated
baseten/llama-7b_fp16_tp1_i8000_o2000_bs30_BASE-tllm_0.9.0.dev2024040200
Updated
baseten/llama3-70b_i9000_o9000_bs32_fp16_tp4-A100-tllm_0.9.0.dev2024040200
Updated
baseten/whisper_trt_tiny.en_H100_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_tiny.en_A100_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_tiny.en_L4_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_tiny.en_A10G_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_base.en_H100_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_base.en_A100_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_small.en_A100_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_base.en_L4_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_base.en_A10G_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_small.en_H100_i224_o512_bs8_bw5
Updated
baseten/whisper_trt_small.en_L4_i224_o512_bs8_bw5
Updated