Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ High-Performance GPU Kernels for Inference
> git clone https://github.com/PFCCLab/flashinfer.git
> cd flashinfer
> git submodule update --init
> pip install apache-tvm-ffi>=0.1.2 # Use TVM FFI 0.1.2 or above
> pip install apache-tvm-ffi>=0.1.6,!=0.1.8,!=0.1.8.post0,<0.2
> pip install filelock jinja2 # Install tools for jit compilation
> pip install --no-build-isolation . -v
> ```
Expand Down
21 changes: 21 additions & 0 deletions scripts/paddle_all_test_cases.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
#!/bin/bash
set -e

python -m pytest -rs tests/attention/test_attention_sink_blackwell.py -k test_blackwell_trtllm_gen_context_attention_sink
python -m pytest -rs tests/attention/test_attention_sink_blackwell.py -k test_blackwell_trtllm_gen_decode_attention_sink
python -m pytest -rs tests/moe/test_trtllm_gen_fused_moe.py::test_fp8_block_scale_routed_activation_type_relu2_smoke
python -m pytest -rs "tests/comm/test_trtllm_allreduce_fusion.py::test_trtllm_allreduce_fusion[True-1024-dtype0-2]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_renormalize_routing[...FP8_Block_DeepSeek-1024-1024-8-RandomHiddenStates]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_sigmoid_routing[...FP8_Block_DeepSeek-1024-1024-8]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_dyn_block_kernel_routing[...FP8_Block_DeepSeek...]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_tier_1024_experts_routing[...FP8_Block_DeepSeek...]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_deepseek_ngroup1_block_per_token_routing[...FP8_Block_DeepSeek...]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_routing_dtype_flexibility[...FP8_Block_DeepSeek...]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_mxfp8_block_scale_moe_relu2_non_gated[...Shuffled E32_K4]"
# python -m pytest -rs tests/moe/test_trtllm_gen_fused_moe.py::test_mxfp8_block_scale_moe_relu2_deepseekv3_topk22
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_fp8_block_scale_autotune_valid_configs[...MxFp8_Relu2]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_fp8_per_tensor_autotune_valid_configs_nonefp8[...PerTensor_Swiglu]"
# python -m pytest -rs "tests/moe/test_trtllm_gen_fused_moe.py::test_llama4_routing[...FP8_Tensor-1024-1024-8]"
# python -m pytest -rs tests/moe/test_trtllm_gen_fused_moe.py::test_deepseekv3_routing
# python -m pytest -rs tests/moe/test_trtllm_gen_fused_moe.py::test_nvfp4_moe_gemm_bias
python -m pytest -rs tests/norm/test_fused_rmsnorm_silu.py
Loading