From bf81e39d833fb7ac21c6ea83962f66503518b992 Mon Sep 17 00:00:00 2001 From: longfei li Date: Mon, 18 Nov 2024 22:13:43 +0800 Subject: [PATCH] =?UTF-8?q?=E7=AE=80=E5=8D=95=E4=BF=AE=E6=94=B9=E4=B8=80?= =?UTF-8?q?=E4=B8=8B=E3=80=82?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- csrc/max.cu | 5 ++++- csrc/md.cu | 3 +++ test | Bin 16480 -> 0 bytes 3 files changed, 7 insertions(+), 1 deletion(-) delete mode 100755 test diff --git a/csrc/max.cu b/csrc/max.cu index 344b62a..8f2f15a 100644 --- a/csrc/max.cu +++ b/csrc/max.cu @@ -81,7 +81,7 @@ __global__ void test_cute_tensor_kernel() Stride<_32, _2>{}); Layout smem_layout = make_layout(make_shape(Int<4>{}, Int<8>{})); __shared__ float smem[decltype(cosize(smem_layout))::value]; // (static-only allocation) - // printf("smem size is :%d\n", decltype(cosize(smem_layout))::value); + printf("smem size is :%d\n", decltype(cosize(smem_layout))::value); Tensor stensor = make_tensor(make_smem_ptr(smem), smem_layout); printf("tensor size is: %d, ind size is: %d, rmem size is: %d , rmem4x8 is: %d, smem size is: %d\n", bool_tensor.size(), @@ -92,7 +92,10 @@ __global__ void test_cute_tensor_kernel() TiledCopy copyA = make_tiled_copy(Copy_Atom, float>{}, // Atom: Copy TAs as if they were uint128_t Layout>{}, // Thr layout 32x8 m-major Layout>{}); // Val layout 4x1 m-major + printf("stensor size 1 is %d\n", cute::size<1>(stensor)); +#if 0 print_latex(copyA); +#endif } // template diff --git a/csrc/md.cu b/csrc/md.cu index 7f62793..809df94 100644 --- a/csrc/md.cu +++ b/csrc/md.cu @@ -5,6 +5,9 @@ #include #include +__device__ void mm_device(const float *src) +{ +} __global__ void md_mm_kernel(const float *src, int stride_a, int stride_b, int stride_c, int thread_num) { int batch_idx = blockIdx.x; diff --git a/test b/test deleted file mode 100755 index c1aeb719b1b4222107590498de4b52f086228556..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 16480 zcmeHOYiu0V6~5~SaY_<9fJOcCWFLSaIl*zATiagmg2lh zU8>FjU#Br6j~N1~DR0(P(gwzBLCJ0fRTiKZ8(0aI77``9Y9+=2gevX_+0~N~^FjK3 zZl_R@d-0-Vj1tvnk9Lv*icr5DX3LMaB7kz;P^f82$gs@!H)9s-xj&d z!yK>Lb=b@K6v~%Vt;=RcyE@lpQ?1!dt~Av;)!o(F)oB&;R)=l^wJVB)#?+>*+v#%5 z5+;|kX4>%Lk7O6Hob-FH+3>4ZrhoF}t5?>)H#^+%yJv3d*+DwgZn7aAD&$WtIq_6K z7YFH>d_1J2Qd!3V0~)ZZwMV4?m+ zgCO{8s^I&8FVwF$fM13qSY8FNT(ziJ%t)FjAQju*HIdKRMb{~~wyo^JZCmVAx{%(L zDZ1&xwk>_xd@jAs8O^4RY+=bQTSxNQVmzblTSnZ@bS{-0Opdti?a6VcV7mn;;}!># z@%S*X^`lNPleF_iw~%%w2DjPU+U)p97ed2{+nvc5ZD^!B2Xh&>zde4N#>x56!0zx$^VJUPS|qR*&!HNe=`W)HYBjI3tNA+QTCTgh=Bs!V z)v8N4{}Je(&vLRj^w8Ha%!E>4<}zzW_`GM?uaC$VFtnsgc%4k5N06E!2eqY z-fg_}--$gZ8WQ{Jf4xqr#Qn2wP5Jf2o}V>5ue(ydwgC84`N|?l<0?h^<0LsX_lI)1 zd_eOw0Xj8z#N%n=b87Ce$J4~))Z7n+hqo=-Tffr&z+V#Jn*;pP0AKIt+y62+bL5MO znYR*q{&;d|TfBX?{pG~|jjteTx%pj7slSa`jjQehiw^GJxDvLB{q^S&`OImz8C`z^ zO4Rkm<)e+Orb+L4rqG`w;r?siBC_U8V&-Jx@Y~lX4xg?~L|#Z7Ipbac2amCXhVs#| z##QK-*i(L{Hy%SQRa(0}v1j8jG*x2en7bsgZ{q`Cj?bMbmyf5AoEPe!fnMZR*jCuj z-3}o++73Hhtfpsa=7%oaLs4g5JpLzmNbGA?ntg+iCxJW*CDOW?wGJDt-{6;p#EjPZ z3Td&g^{n+xqjhLrD+A;y^7Zob{zlB)_5Muh^q#xkkCZmtd)Mi589nSkxcAsmFFD#@ z|EPBKQ`B?-wHsnEq;CWlpDdSM&@AX9pm&1OH@&Ap zzX1B!JLNKcJG=T+xqJe28gvO>+34FQmB<~#Dl*j+xoF9vh69Y#H~by2Urh@Ai|Esj zx&lWhj)Q+Km+70NTGlkMY{dW`V~* zrBJK~aU4Os`w5IMYkHujZ|ONTccMk;AE58y=t4g}S0Ufx$zKJYg?y!7KBUEjgeA;C zn1L_@VFtnsgc%4k5N06EK$w9r10N{^vQACbrO7%p`uatM*2qy2p4P-sSz?H{j(I8b z2YG#)erEwD>*6kAxx72IFfZ%i=zWNatUdetnR1@^CwQ@#tO0A{imd&5ljX7oEynGW zHF7J+2}-je-kHtR0bWlgYvgva2EEr&ku`D`8de=;K=4^^h_pM(@nx-?#J`m7Men_` z=^xZJgpZWEzmx0_-yJnC?ZRuM=7(7RFXrpm@Bf;3>%0Sw+xP;;m<}=BDHk@N|54e7 zn6cQ@*LPj?s_mntoLh>vw_BZ7TWfnsv+Z|xbXaYjYZ(6U2y{8>)I0c~TUqG(L?C&P z2SSv^=YuY!PuH&ot3^)+`bl<#M|u4wSY6iROt{=n468v@B3SP`)MF4HE{axJN7N^k z+z+CECo1Ge?o+|{YW-&K{u2CgR2FLg543)Zx+xHsKF*VWi|s7XDJF=aH{iyJ z0#^Zi5cJXAFJYDjU)?hyOqbv zb7wSTyUs2Jpy-yy#;l~8UvO``6Lyl8+!vvl%G(879f*g4?jQrIwn)%>NT=G!vZ1+Z!JjlDgaVNx2k2W?(*KQP?0 zC2q&J_R~HC8#_Mic)~VdqJLP~{Wovz*)rJYS>HG?FcQc9fS%sXaag2Nj_Y6(!i{K1 zDwDHI#dHdO{44!qvPz$p=70RH2*wRB{KsV|=IwEGleR!mauGDJpTLWY-2tXWW@~|m zoA#JZ60(n>GK$HwjSUx)A=*hnyBR9=Y|4V!%7B#QC8NMnT`gXWxKUu|C<=~9t-rs43N0TsV}aDN?r z2k{sAzbF{ZTm1GiZxR|6MW#Xf&jbGl=B(0wnb!-witTuMdsh1$$Z1Y5_A>7m+D*wt zp*B)g`Y-eE3^1DNiM_l>2#v8lRCEcj>PtXrPA>K`4;L!$Gtz$16M8r7X^t=aBr6IX zGGVeu|3tuknhk`;#E_}@6Z)fo z{VWTF{+{zMZp2Rb=K}UJ4-_iz&!Qi^e}2yP-rOn5noNWG!V7(k?PdJbi5=5^$o)m^ z1p6&2)J3sRM2$q~3B!7489xFXLuDBbdGD6r1!O;LFkfOX^c~nX`t0RBX>Th)6wx!> zJTExS<7w-ICQRbTVn))$_AAJ_uf%+HsxIgFtnNw0eyxX?in#Mrx%Ph57(49d0don2 q^jnLxU!FgUfl1r__EVjPTO1HdT+yZ1uYigc-TP^y(GoBSu