diff --git a/examples/inference/README.md b/examples/inference/README.md new file mode 100644 index 0000000..695f04b --- /dev/null +++ b/examples/inference/README.md @@ -0,0 +1,2 @@ +# Example of LLM inference using FlashAttention +