baseten/btest-Mistral-7B-Instruct-v0.2-A100-2a115dae-TP2-lora
Updated
baseten/btest-Mistral-7B-Instruct-v0.2-A100-2a115dae-TP1-lora
Updated
baseten/llama3-8b-i7000-o1000-with-lora-trtllm-0.11.0.dev2024052100-h100-mig-tp1-fixed-2
Updated
baseten/llama3-70b-instruct_fp8_tp4_i7168_o1024_bs40_fmha-tllm_0.11.0.dev2024061800
Updated
baseten/sdxl-1.0-trt-8.6.1-dynamic-sizing-with-refine-h100-mig
Updated
baseten/sdxl-1.0-trt-8.6.1-dynamic-sizing-h100-mig
Updated
baseten/writer_palmyra_med_70b_8k_i7192_o2048_bs42_fp16_A100_tp4-tllm_0.9.0.dev2024040200
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs32_bw1_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs32_bw1_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs32_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs32_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs32_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs16_bw1_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs16_bw1_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs16_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs16_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs16_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs8_bw1_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs8_bw1_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs8_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs8_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs8_bw2_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs32_bw2_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs32_bw2_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs16_bw2_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs16_bw2_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs64_bw3_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs64_bw3_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs64_bw3_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs8_bw2_int4
Updated