// setup.cpp #include #include "matrix_add.h" PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) { m.def("matrix_add", &matrix_add, "FP16 Matrix Add"); }