.gitignore
.gitmodules
.pre-commit-config.yaml
.yamlfmt
CLAUDE.md
CONTRIBUTING.md
LICENCE
NOTICE
README.md
RELEASE.md
pyproject.toml
.claude/skills/add-reference-tests/SKILL.md
.claude/skills/clone-repos/SKILL.md
.claude/skills/extract-kernel-definitions/SKILL.md
.github/workflows/build-and-upload-pypi.yml
.github/workflows/claude-code-review.yml
.github/workflows/claude.yml
.github/workflows/linting.yaml
.github/workflows/unit_test.yaml
docs/docs.json
docs/index.mdx
docs/styles.css
docs/api/build_docs.sh
docs/api/conf.py
docs/api/index.md
docs/api/requirements.txt
docs/api/_static/brand/fib-dark.png
docs/api/_static/brand/fib-light.png
docs/api/rst/agents.md
docs/api/rst/apply.md
docs/api/rst/compile.md
docs/api/rst/data.md
docs/api/rst/data_definition.md
docs/api/rst/data_solution.md
docs/api/rst/data_trace.md
docs/api/rst/data_trace_set.md
docs/api/rst/data_workload.md
docs/api/rst/tracing.md
docs/flashinfer-trace/definition.mdx
docs/flashinfer-trace/index.mdx
docs/flashinfer-trace/solution.mdx
docs/flashinfer-trace/trace.mdx
docs/flashinfer-trace/workload.mdx
docs/logo/fib-black-bg.png
docs/logo/fib-white-bg.png
docs/logo/fib_logo.png
docs/logo/fib_mark.png
docs/op-types/dsa-paged.mdx
docs/op-types/gdn.mdx
docs/op-types/gemm.mdx
docs/op-types/gqa-paged.mdx
docs/op-types/gqa-ragged.mdx
docs/op-types/mla-paged.mdx
docs/op-types/moe.mdx
docs/op-types/rmsnorm.mdx
docs/op-types/sampling.mdx
docs/start/installation.mdx
docs/start/quickstart.mdx
docs/tutorials/bring-your-own-kernel.mdx
examples/fi_gqa_e2e_example.py
examples/win_at_p.py
examples/ffi/.gitignore
examples/ffi/CMakeLists.txt
examples/ffi/README.md
examples/ffi/agent_vibecode.md
examples/ffi/cpp_example.cc
examples/ffi/distribute_kernel.py
examples/ffi/jax_example.py
examples/ffi/kernel_generator_example.py
examples/ffi/pytorch_example.py
examples/ffi/Example-FlashInfer-Trace/definitions/gemm_n4096_k4096.json
examples/ffi/Example-FlashInfer-Trace/solutions/example_agent_solution.json
examples/ffi/Example-FlashInfer-Trace/workloads/gemm_n4096_k4096.jsonl
examples/kernel_generator/.env.example
examples/kernel_generator/README.md
examples/kernel_generator/kernel_generator.py
examples/kernel_generator/kernel_generator_example.py
examples/kernel_generator/kernel_generator_prompts.py
examples/res/win_at_p_curve_gemm_o3_gpt-5.png
flashinfer_bench/__init__.py
flashinfer_bench/env.py
flashinfer_bench/logging.py
flashinfer_bench/utils.py
flashinfer_bench.egg-info/PKG-INFO
flashinfer_bench.egg-info/SOURCES.txt
flashinfer_bench.egg-info/dependency_links.txt
flashinfer_bench.egg-info/entry_points.txt
flashinfer_bench.egg-info/requires.txt
flashinfer_bench.egg-info/top_level.txt
flashinfer_bench/agents/__init__.py
flashinfer_bench/agents/_solution_runner.py
flashinfer_bench/agents/ffi_prompt.py
flashinfer_bench/agents/ncu.py
flashinfer_bench/agents/sanitizer.py
flashinfer_bench/agents/schema.py
flashinfer_bench/agents/solution_handler.py
flashinfer_bench/apply/__init__.py
flashinfer_bench/apply/apply_api.py
flashinfer_bench/apply/config.py
flashinfer_bench/apply/key.py
flashinfer_bench/apply/presets.py
flashinfer_bench/apply/runtime.py
flashinfer_bench/apply/table.py
flashinfer_bench/bench/__init__.py
flashinfer_bench/bench/benchmark.py
flashinfer_bench/bench/config.py
flashinfer_bench/bench/timing.py
flashinfer_bench/bench/utils.py
flashinfer_bench/bench/evaluators/__init__.py
flashinfer_bench/bench/evaluators/default.py
flashinfer_bench/bench/evaluators/evaluator.py
flashinfer_bench/bench/evaluators/lowbit.py
flashinfer_bench/bench/evaluators/registry.py
flashinfer_bench/bench/evaluators/sampling.py
flashinfer_bench/bench/evaluators/utils.py
flashinfer_bench/bench/runner/__init__.py
flashinfer_bench/bench/runner/isolated_runner.py
flashinfer_bench/bench/runner/persistent_runner.py
flashinfer_bench/bench/runner/runner.py
flashinfer_bench/cli/__init__.py
flashinfer_bench/cli/main.py
flashinfer_bench/compile/__init__.py
flashinfer_bench/compile/builder.py
flashinfer_bench/compile/registry.py
flashinfer_bench/compile/runnable.py
flashinfer_bench/compile/utils.py
flashinfer_bench/compile/builders/__init__.py
flashinfer_bench/compile/builders/python_builder.py
flashinfer_bench/compile/builders/tilelang_builder.py
flashinfer_bench/compile/builders/torch_builder.py
flashinfer_bench/compile/builders/triton_builder.py
flashinfer_bench/compile/builders/tvm_ffi_builder.py
flashinfer_bench/data/__init__.py
flashinfer_bench/data/definition.py
flashinfer_bench/data/json_utils.py
flashinfer_bench/data/solution.py
flashinfer_bench/data/trace.py
flashinfer_bench/data/trace_set.py
flashinfer_bench/data/utils.py
flashinfer_bench/data/workload.py
flashinfer_bench/integration/__init__.py
flashinfer_bench/integration/patch_manager.py
flashinfer_bench/integration/utils.py
flashinfer_bench/integration/flashinfer/__init__.py
flashinfer_bench/integration/flashinfer/common.py
flashinfer_bench/integration/flashinfer/adapters/__init__.py
flashinfer_bench/integration/flashinfer/adapters/gqa_paged_decode.py
flashinfer_bench/integration/flashinfer/adapters/gqa_paged_prefill.py
flashinfer_bench/integration/flashinfer/adapters/linear.py
flashinfer_bench/integration/flashinfer/adapters/mla_paged.py
flashinfer_bench/integration/flashinfer/adapters/ragged_prefill.py
flashinfer_bench/integration/flashinfer/adapters/rmsnorm.py
flashinfer_bench/tracing/__init__.py
flashinfer_bench/tracing/config.py
flashinfer_bench/tracing/policy.py
flashinfer_bench/tracing/presets.py
flashinfer_bench/tracing/runtime.py
flashinfer_bench/tracing/tracing.py
flashinfer_bench/tracing/workload_entry.py
flashinfer_trace/README.md
flashinfer_trace/definition.md
flashinfer_trace/solution.md
flashinfer_trace/trace.md
flashinfer_trace/definitions/dsa_paged/dsa_sparse_attention_h16_ckv512_kpe64_topk2048_ps1.json
flashinfer_trace/definitions/dsa_paged/dsa_sparse_attention_h16_ckv512_kpe64_topk2048_ps64.json
flashinfer_trace/definitions/dsa_paged/dsa_topk_indexer_fp8_h64_d128_topk2048_ps64.json
flashinfer_trace/definitions/gdn/gdn_decode_qk4_v8_d128_k_last.json
flashinfer_trace/definitions/gdn/gdn_decode_qk8_v16_d128_k_last.json
flashinfer_trace/definitions/gdn/gdn_prefill_qk4_v8_d128_k_last.json
flashinfer_trace/definitions/gdn/gdn_prefill_qk8_v16_d128_k_last.json
flashinfer_trace/definitions/gemm/gemm_n128_k2048.json
flashinfer_trace/definitions/gemm/gemm_n2048_k4096.json
flashinfer_trace/definitions/gemm/gemm_n256_k7168.json
flashinfer_trace/definitions/gemm/gemm_n28672_k4096.json
flashinfer_trace/definitions/gemm/gemm_n4096_k14336.json
flashinfer_trace/definitions/gemm/gemm_n4096_k4096.json
flashinfer_trace/definitions/gemm/gemm_n5120_k2048.json
flashinfer_trace/definitions/gemm/gemm_n6144_k4096.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_decode_h32_kv4_d128_ps1.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_decode_h32_kv4_d128_ps64.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_decode_h32_kv8_d128_ps1.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_decode_h32_kv8_d128_ps64.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_prefill_causal_h32_kv4_d128_ps1.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_prefill_causal_h32_kv4_d128_ps64.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_prefill_causal_h32_kv8_d128_ps1.json
flashinfer_trace/definitions/gqa_paged/gqa_paged_prefill_causal_h32_kv8_d128_ps64.json
flashinfer_trace/definitions/gqa_ragged/gqa_ragged_prefill_causal_h32_kv4_d128.json
flashinfer_trace/definitions/gqa_ragged/gqa_ragged_prefill_causal_h32_kv8_d128.json
flashinfer_trace/definitions/mla_paged/mla_paged_decode_h16_ckv512_kpe64_ps1.json
flashinfer_trace/definitions/mla_paged/mla_paged_decode_h16_ckv512_kpe64_ps64.json
flashinfer_trace/definitions/mla_paged/mla_paged_prefill_causal_h16_ckv512_kpe64_ps1.json
flashinfer_trace/definitions/mla_paged/mla_paged_prefill_causal_h16_ckv512_kpe64_ps64.json
flashinfer_trace/definitions/moe/moe_fp8_block_scale_ds_routing_topk8_ng8_kg4_e32_h7168_i2048.json
flashinfer_trace/definitions/rmsnorm/fused_add_rmsnorm_h2048.json
flashinfer_trace/definitions/rmsnorm/fused_add_rmsnorm_h4096.json
flashinfer_trace/definitions/rmsnorm/fused_add_rmsnorm_h7168.json
flashinfer_trace/definitions/rmsnorm/rmsnorm_h128.json
flashinfer_trace/definitions/rmsnorm/rmsnorm_h1536.json
flashinfer_trace/definitions/rmsnorm/rmsnorm_h2048.json
flashinfer_trace/definitions/rmsnorm/rmsnorm_h4096.json
flashinfer_trace/definitions/rmsnorm/rmsnorm_h512.json
flashinfer_trace/definitions/rmsnorm/rmsnorm_h7168.json
flashinfer_trace/definitions/sampling/top_k_sampling_from_probs_v128256.json
flashinfer_trace/definitions/sampling/top_k_sampling_from_probs_v129280.json
flashinfer_trace/definitions/sampling/top_k_sampling_from_probs_v151936.json
flashinfer_trace/definitions/sampling/top_k_top_p_sampling_from_probs_v128256.json
flashinfer_trace/definitions/sampling/top_k_top_p_sampling_from_probs_v129280.json
flashinfer_trace/definitions/sampling/top_k_top_p_sampling_from_probs_v151936.json
flashinfer_trace/definitions/sampling/top_p_sampling_from_probs_v128256.json
flashinfer_trace/definitions/sampling/top_p_sampling_from_probs_v129280.json
flashinfer_trace/definitions/sampling/top_p_sampling_from_probs_v151936.json
flashinfer_trace/tests/references/test_dsa_sparse_attention_h16_ckv512_kpe64_topk256_ps1.py
flashinfer_trace/tests/references/test_dsa_sparse_attention_h16_ckv512_kpe64_topk256_ps64.py
flashinfer_trace/tests/references/test_dsa_vs_definition_reference.py
flashinfer_trace/tests/references/test_gdn_decode_qk4_v8_d128_k_last.py
flashinfer_trace/tests/references/test_gdn_decode_qk8_v16_d128_k_last.py
flashinfer_trace/tests/references/test_gdn_prefill_qk4_v8_d128_k_last.py
flashinfer_trace/tests/references/test_gdn_prefill_qk8_v16_d128_k_last.py
flashinfer_trace/tests/references/test_gqa_paged_decode_h32_kv4_d128_ps1.py
flashinfer_trace/tests/references/test_gqa_paged_decode_h32_kv4_d128_ps64.py
flashinfer_trace/tests/references/test_gqa_paged_decode_h32_kv8_d128_ps1.py
flashinfer_trace/tests/references/test_gqa_paged_decode_h32_kv8_d128_ps64.py
flashinfer_trace/tests/references/test_gqa_paged_prefill_h32_kv4_d128_ps1.py
flashinfer_trace/tests/references/test_gqa_paged_prefill_h32_kv4_d128_ps64.py
flashinfer_trace/tests/references/test_gqa_paged_prefill_h32_kv8_d128_ps1.py
flashinfer_trace/tests/references/test_gqa_paged_prefill_h32_kv8_d128_ps64.py
flashinfer_trace/tests/references/test_gqa_ragged_prefill_h32_kv4_d128.py
flashinfer_trace/tests/references/test_gqa_ragged_prefill_h32_kv8_d128.py
flashinfer_trace/tests/references/test_mla_paged_decode_h16_ckv512_kpe64_ps1.py
flashinfer_trace/tests/references/test_mla_paged_decode_h16_ckv512_kpe64_ps64.py
flashinfer_trace/tests/references/test_mla_paged_prefill_h16_ckv512_kpe64_ps1.py
flashinfer_trace/tests/references/test_mla_paged_prefill_h16_ckv512_kpe64_ps64.py
flashinfer_trace/tests/references/test_moe_fp8_block_scale_ds_routing_topk8_ng8_kg4_e32_h7168_i2048.py
flashinfer_trace/tests/references/test_rmsnorm_h128.py
flashinfer_trace/tests/references/test_rmsnorm_h2048.py
flashinfer_trace/tests/references/test_rmsnorm_h4096.py
flashinfer_trace/tests/references/test_rmsnorm_h7168.py
flashinfer_trace/tests/references/test_top_k_sampling_from_probs.py
flashinfer_trace/tests/references/test_top_k_top_p_sampling_from_probs.py
flashinfer_trace/tests/references/test_top_p_sampling_from_probs.py
flashinfer_trace/workloads/gemm/gemm_n128_k2048.jsonl
flashinfer_trace/workloads/gemm/gemm_n2048_k4096.jsonl
flashinfer_trace/workloads/gemm/gemm_n256_k7168.jsonl
flashinfer_trace/workloads/gemm/gemm_n28672_k4096.jsonl
flashinfer_trace/workloads/gemm/gemm_n4096_k14336.jsonl
flashinfer_trace/workloads/gemm/gemm_n4096_k4096.jsonl
flashinfer_trace/workloads/gemm/gemm_n5120_k2048.jsonl
flashinfer_trace/workloads/gemm/gemm_n6144_k4096.jsonl
flashinfer_trace/workloads/gqa_paged/gqa_paged_decode_h32_kv4_d128_ps1.jsonl
flashinfer_trace/workloads/gqa_paged/gqa_paged_decode_h32_kv8_d128_ps1.jsonl
flashinfer_trace/workloads/gqa_paged/gqa_paged_prefill_causal_h32_kv4_d128_ps1.jsonl
flashinfer_trace/workloads/gqa_paged/gqa_paged_prefill_causal_h32_kv8_d128_ps1.jsonl
flashinfer_trace/workloads/gqa_ragged/gqa_ragged_prefill_causal_h32_kv4_d128.jsonl
flashinfer_trace/workloads/gqa_ragged/gqa_ragged_prefill_causal_h32_kv8_d128.jsonl
flashinfer_trace/workloads/mla_paged/mla_paged_decode_h16_ckv512_kpe64_ps1.jsonl
flashinfer_trace/workloads/mla_paged/mla_paged_prefill_causal_h16_ckv512_kpe64_ps1.jsonl
flashinfer_trace/workloads/moe/moe_fp8_block_scale_ds_routing_topk8_ng8_kg4_e32_h7168_i2048.jsonl
flashinfer_trace/workloads/rmsnorm/fused_add_rmsnorm_h2048.jsonl
flashinfer_trace/workloads/rmsnorm/fused_add_rmsnorm_h4096.jsonl
flashinfer_trace/workloads/rmsnorm/fused_add_rmsnorm_h7168.jsonl
flashinfer_trace/workloads/rmsnorm/rmsnorm_h128.jsonl
flashinfer_trace/workloads/rmsnorm/rmsnorm_h1536.jsonl
flashinfer_trace/workloads/rmsnorm/rmsnorm_h2048.jsonl
flashinfer_trace/workloads/rmsnorm/rmsnorm_h4096.jsonl
flashinfer_trace/workloads/rmsnorm/rmsnorm_h512.jsonl
flashinfer_trace/workloads/rmsnorm/rmsnorm_h7168.jsonl
licenses/cutlass.LICENSE.txt
scripts/linting.sh
tests/__init__.py
tests/conftest.py
tests/test_logging.py
tests/agent/__init__.py
tests/agent/test_prompt.py
tests/apply/__init__.py
tests/apply/test_api.py
tests/apply/test_config.py
tests/apply/test_key.py
tests/apply/test_runtime.py
tests/apply/test_table.py
tests/bench/__init__.py
tests/bench/test_benchmark.py
tests/bench/test_benchmark_config.py
tests/bench/test_evaluator.py
tests/bench/test_isolated_runner.py
tests/bench/test_persistent_runner.py
tests/compile/__init__.py
tests/compile/test_builder.py
tests/compile/test_python_builder.py
tests/compile/test_runnable.py
tests/compile/test_tilelang_builder.py
tests/compile/test_torch_builder.py
tests/compile/test_triton_builder.py
tests/compile/test_tvm_ffi_builder.py
tests/compile/test_utils.py
tests/data/__init__.py
tests/data/test_definition.py
tests/data/test_load_dump_schema.py
tests/data/test_read_traces.py
tests/data/test_solution.py
tests/data/test_trace.py
tests/data/test_trace_set.py
tests/flashinfer_trace/__init__.py
tests/flashinfer_trace/test_resources.py
tests/integration/__init__.py
tests/integration/test_patch_manager.py
tests/integration/test_utils.py
tests/integration/flashinfer/__init__.py
tests/integration/flashinfer/test_common.py
tests/integration/flashinfer/test_gqa_paged_decode.py
tests/integration/flashinfer/test_gqa_paged_prefill.py
tests/integration/flashinfer/test_mla_paged.py
tests/integration/flashinfer/test_ragged_prefill.py
tests/integration/flashinfer/test_rmsnorm.py
tests/integration/samplemods/__init__.py
tests/integration/samplemods/pm_dummy.py
tests/tracing/__init__.py
tests/tracing/test_config.py
tests/tracing/test_presets.py
tests/tracing/test_runtime.py
web/.gitignore
web/README.md
web/package.json
web/pnpm-lock.yaml
web/pnpm-workspace.yaml
web/turbo.json
web/apps/docs/content
web/apps/docs/gen_api_docs.sh
web/apps/docs/mdx-components.js
web/apps/docs/next.config.ts
web/apps/docs/package.json
web/apps/docs/postcss.config.js
web/apps/docs/tsconfig.json
web/apps/docs/app/globals.css
web/apps/docs/app/layout.jsx
web/apps/docs/app/[[...mdxPath]]/page.jsx
web/apps/web/.eslintrc.json
web/apps/web/microfrontends.json.disabled
web/apps/web/middleware.ts
web/apps/web/next.config.ts
web/apps/web/package.json
web/apps/web/postcss.config.js
web/apps/web/tsconfig.json
web/apps/web/app/globals.css
web/apps/web/app/icon.png
web/apps/web/app/kernels.tsx
web/apps/web/app/layout.tsx
web/apps/web/app/models.tsx
web/apps/web/app/page.tsx
web/apps/web/app/kernels/[name]/axes-sig.tsx
web/apps/web/app/kernels/[name]/constraints.tsx
web/apps/web/app/kernels/[name]/header.tsx
web/apps/web/app/kernels/[name]/page.tsx
web/apps/web/app/kernels/[name]/reference.tsx
web/apps/web/app/kernels/[name]/solutions-list.tsx
web/apps/web/app/kernels/[name]/solutions-types.ts
web/apps/web/app/kernels/[name]/solutions.tsx
web/apps/web/app/leaderboard/client.tsx
web/apps/web/app/leaderboard/section.tsx
web/apps/web/app/models/page.tsx
web/apps/web/app/models/[id]/arch-overview.tsx
web/apps/web/app/models/[id]/model-tabs.tsx
web/apps/web/app/models/[id]/page.tsx
web/apps/web/app/viewer/page.tsx
web/apps/web/app/viewer/viewer.tsx
web/apps/web/components/fast-p-chart.tsx
web/apps/web/components/fast-p-label.tsx
web/apps/web/components/model-card.tsx
web/apps/web/components/layout/footer.tsx
web/apps/web/components/layout/header.tsx
web/apps/web/data/baselines.ts
web/apps/web/data/models.ts
web/apps/web/lib/analytics.ts
web/apps/web/lib/data-loader.ts
web/apps/web/lib/model-utils.ts
web/apps/web/lib/utils.ts
web/apps/web/lib/schemas/index.ts
web/apps/web/lib/schemas/model.ts
web/apps/web/lib/schemas/trace.ts
web/apps/web/scripts/prebuild.mjs
web/packages/config/package.json
web/packages/config/tsconfig.json
web/packages/config/src/index.ts
web/packages/ui/package.json
web/packages/ui/tsconfig.json
web/packages/ui/src/index.ts
web/packages/ui/src/brand/Logo.tsx
web/packages/ui/src/brand/fib-black-bg.png
web/packages/ui/src/brand/fib-white-bg.png
web/packages/ui/src/brand/fib_logo.png
web/packages/ui/src/brand/fib_mark.png
web/packages/ui/src/components/alert.tsx
web/packages/ui/src/components/avatar.tsx
web/packages/ui/src/components/badge.tsx
web/packages/ui/src/components/button.tsx
web/packages/ui/src/components/card.tsx
web/packages/ui/src/components/dropdown-menu.tsx
web/packages/ui/src/components/hover-card.tsx
web/packages/ui/src/components/input.tsx
web/packages/ui/src/components/label.tsx
web/packages/ui/src/components/progress-circle.tsx
web/packages/ui/src/components/select.tsx
web/packages/ui/src/components/site-footer.tsx
web/packages/ui/src/components/site-header.tsx
web/packages/ui/src/components/table.tsx
web/packages/ui/src/components/tabs.tsx
web/packages/ui/src/components/textarea.tsx
web/packages/ui/src/components/toaster.tsx
web/packages/ui/src/providers/Providers.tsx
web/packages/utils/package.json
web/packages/utils/tsconfig.json
web/packages/utils/src/index.ts