baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs8_bw5_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs8_bw5_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs8_bw5_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs8_bw5_int4
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs64_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs64_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs32_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs64_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs32_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs32_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs32_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs32_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs16_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs16_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs16_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs16_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs16_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_MIG_3g.40gb_i224_o512_bs8_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A10G_i224_o512_bs8_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_L4_i224_o512_bs8_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_A100-SXM4-80GB_i224_o512_bs8_bw5_int8
Updated
baseten/whisper_trt_large-v3_NVIDIA_H100_80GB_HBM3_i224_o512_bs8_bw5_int8
Updated
baseten/llama3-70b-instruct_fp8_tp2_i7068_o1024_bs40_mnt_10000_mp_fmha_moae-tllm_0.11.0.dev2024061800
Updated
baseten/llama-3-8b-medusa-fp16
Updated
baseten/slingshot-tokenizer
Updated
baseten/llama3-70b-instruct_fp8_tp4_i7168_o1024_bs32-tllm_0.9.0
Updated
baseten/llama3-70b_fp8_tp4_i7168_o1024_bs32-tllm_0.9.0
Updated
baseten/writer_palmyra_med_70b_32K_i25000_o7000_bs16_tp4_A100_0.9.0.dev2024040200
Updated
baseten/writer_llama3_70b_32K_i25000_o7000_bs16_tp4_A100_0.11.0.dev2024052100
Updated
baseten/mistral_i1600_o600_bs96_fp16_tp1_lora_triton_tllm_bck_v0.10.0
Updated