baseten/whisper-large-v2-weights-only-int8-optimum-quanto
Updated
baseten/llama-70b_fp8_tp2_i1024_o100_bs32-tllm_0.13.0.dev2024081300
Updated
baseten/llama-70b_fp8_tp1_i1024_o100_bs16-tllm_0.13.0.dev2024081300
Updated
baseten/llama-70b_fp8_tp1_i1024_o100_bs16-tllm_0.12.0.dev2024072301
Updated
baseten/llama3.1-70b-instruct_fp8_tp2_i3100_seq3300_bs64_kv-2ga0125d
Updated
baseten/btest-Meta-Llama-3-8B-Instruct-A100-5fa9436e-TP2
Updated
baseten/btest-Meta-Llama-3-8B-Instruct-A100-5fa9436e-TP1
Updated
baseten/btest-Mistral-7B-Instruct-v0.2-A100-5fa9436e-TP2
Updated
baseten/btest-Mistral-7B-Instruct-v0.2-A100-5fa9436e-TP1
Updated
baseten/llama-70b_fp8_tp4_i1024_o100_bs32-tllm_0.12.0.dev2024072301
Updated
baseten/llama-70b_fp8_tp2_i1024_o100_bs32-tllm_0.12.0.dev2024072301
Updated
baseten/llama3.1-70b-instruct_fp8_tp4_i3000_o100_bs40_kvc-2ga0125d
Updated
baseten/Meta-Llama-3-70B-H100-2ga0125d-TP4-FP8
Updated
baseten/Llama-Guard-3-8b_i8190_o2_bs20_fp16_tp1-tllm_0.12.0.dev2024072301
Updated
baseten/Meta-Llama-3.1-70B-H100-2ga0125d-TP4-FP8-64k-32TPB
Updated
baseten/Meta-Llama-3.1-70B-H100-2ga0125d-TP4-FP8-7168-32TPB
Updated
baseten/Meta-Llama-3.1-70B-H100-2ga0125d-TP4-FP8-7168
Updated
baseten/Meta-Llama-3.1-70B-H100-2ga0125d-TP4-FP8
Updated
baseten/btest-Meta-Llama-3.1-8B-A100-5fa9436e-TP1
Updated
baseten/btest-bloom-560m-A100-5fa9436e-TP2
Updated
baseten/btest-bloom-560m-A100-5fa9436e-TP1
Updated
baseten/whisper-tllm-large-v3-int8-0.12.0.dev2024071600
Updated
baseten/btest-Mistral-7B-Instruct-v0.2-A100-2a115dae-TP2
Updated
baseten/btest-Mistral-7B-Instruct-v0.2-A100-2a115dae-TP1
Updated
baseten/whisper-large-v2-0.11.0.dev2024061800-bs8-mbw5
Updated
baseten/writer_palmyra_fin_70b_32K_i25000_o7000_bs16_tp4_A100_0.9.0.dev2024040200
Updated
baseten/3000_o1000_bs8_fp16_tp1-tllm_0.9.0.dev2024022000
Updated
baseten/btest-bloom-560m-A100-2a115dae-TP2
Updated
baseten/btest-bloom-560m-A100-2a115dae-TP1
Updated