flashinfer-ai
diff --git a/.gitignore
Lines changed: 1 addition & 0 deletions b/.gitignore
Lines changed: 1 addition & 0 deletions
diff --git a/README.md
Lines changed: 1 addition & 1 deletion b/README.md
Lines changed: 1 addition & 1 deletion
diff --git a/csrc/nv_internal/cpp/kernels/quantization.cu
Lines changed: 2 additions & 0 deletions b/csrc/nv_internal/cpp/kernels/quantization.cu
Lines changed: 2 additions & 0 deletions
@@ -7,6 +7,7 @@ compile_commands.json
 
 # Generated files
 csrc/generated/
+csrc/nv_internal/tensorrt_llm/cutlass_instantiations/
 docs/generated/
 flashinfer/_build_meta.py
 flashinfer/data/
 
@@ -88,7 +88,7 @@ python -m flashinfer.aot
 # Build AOT wheel
 python -m build --no-isolation --wheel
 # Install AOT wheel
-python -m pip install dist/flashinfer-*.whl
+python -m pip install dist/flashinfer_*.whl
 ```
 
 For more details, refer to the [Install from Source documentation](https://docs.flashinfer.ai/installation.html#install-from-source).
 
@@ -363,5 +363,7 @@ template void invokeBatchedFP4Quantization<__nv_fp8_e4m3, 32>(
     int32_t* SFOuput, bool useUE8M0, int multiProcessorCount, cudaStream_t stream);
 #endif
 
+////////////////////////////////////////////////////////////////////////////////////////////////////
+
 }  // namespace kernels
 }  // namespace tensorrt_llm