From 30e1c3171e5b4508210594b7a6cf1af079f1026e Mon Sep 17 00:00:00 2001 From: josc146 Date: Wed, 25 Oct 2023 22:39:20 +0800 Subject: [PATCH] update kernel (CUDA Compute Capability 5.3) --- backend-python/rwkv_pip/beta/wkv_cuda.pyd | Bin 640512 -> 640512 bytes backend-python/rwkv_pip/rwkv5.pyd | Bin 404992 -> 404992 bytes backend-python/rwkv_pip/wkv_cuda.pyd | Bin 475136 -> 475136 bytes 3 files changed, 0 insertions(+), 0 deletions(-) diff --git a/backend-python/rwkv_pip/beta/wkv_cuda.pyd b/backend-python/rwkv_pip/beta/wkv_cuda.pyd index 7f12a48b8eb68c1c49ab79dcafc6bf2bb9e88e9a..7734f12573204cd6497cf1c18656286f9d4abcec 100644 GIT binary patch delta 4260 zcmeHKYiv}<6+U}kGqc{i_wKIoF2?a17qP`r9Yf@`+azT{3QmNxfFeOFZxxguyb`KV z(vlxdy)A7_qX=9z>9ryiT+(1ysR%?>uV@n>gaScrL=dVeYEvE(j+)|hDcFf>);(ut zHcg{Os?@(->1wodX3pa~-#If=ekNCbCU@Yo5##Ze?QM~Pwg`O&ekOhves$y>>#vM;kQ{xM;XBIxry1crXm0fx*K82 zE3=`}H3n7qMHW2hg0lH&o@H>}e5B8V?{5JpT&{SnRX891au;u8{T0?)Ega8sXw2E= zekck#`YYU24gl`!zQK-G;k#K#q{fwz#sD(V(dW$?i9p#e-DEA*!nrIoHYz8;Q~Mfc zqn!JtirycGlQypJ^-x}LKgh?tF&pKry_4j?`7A_XL@ucFLK5@>49NeJ;g*2++y6_{ z+ddX`{>S`8!~h7YyLodGV6^19J&|&HZE3EPrup_gyqU)09^OFXx;=cgTsI%apbUd0 z-(iSE_|_hNm=uLOf5KZ$iR04$fMYb3{x=-sDV;2hqx&g1#$2`UlQ=?5;pn2AaIAAb zfg_J89EGcJjKwsL!KxSe)~JkFNAM!wYoOzpU}Q^LvnLi~cG+y{WwEYE+1%K73lm&E zPHf^&5{^ddBnFf$Su;4Yp3)7J0}`ON-!-~W4whw&&&-I^pZ|!Bu3{mx6f2R9$dp3x z{wTjDy{dCU+!tQ`8J{l`6n}}gOW=+AH4*T?guqYHg5pd3TM;Q(ghWT~LfjcA!834+`55hbic@RjCCwzOIZI$z;;&8x7VRsq9@ zx-=S1mYf+JF(Xl|d;D2gn$zL4uka=|cajxkl6+tJl>p_}9G{kc_};t0+lTlO=$OYwGIxU^EQ&TfDGhS1LxPTrx=_v_ADy2NB>A6Jv z5vHWpYgpr|DcF(|bMt?v1%J!}ODVFL&XjBhmZex9cKn*xs~m%~4Q&U-SNU$r>BOr# zXE9&#y%VFik7q5#h0)R+mjE38a@HZ=g7(+=j~XeLv5Z>32-gGlp(baHwS7wC{*&8z+wNO^D;tD(uLDNGcp+$q{U>{t8C4z$RE> zYb9}ceFzz|qpyzSbx?GKN{hsC5HkxoxjxF3o@DYQ4A~uhl0*oT5M7d9ocGw}a;7&L zT|;oCdl&L0f5Aj>%OUoRmTYGYj^T-;yjj-P)z|ra@;-h{c|ZRcZ$pwCqwI0Be!WB9 z8ueX}iFEXVp{!2^TaNKRBZC!5TuqYNvBR(HGOf^Nm&=icCV z&8@J#k}up<{Bd2y7mrImoJ&tz1z98*V*k^+)5TSaf6o(w8ZCY8aO1Ge2`Q^#nAF1fE> zpA(l@VY7_TLhg{l2AvJYWUi4*m=1Cvr5s9Ul!Nv4%D`3az$`<_8yeKSV-FxD{HB}K z|Bq%7jI`7rmVd+VH2Z6H-YQe54|U;<*toE$gXYZBLE$_xCQhg`DAwxS)LF0`#ruTL z-gWJhK)pj&M_(K}R)%%-*-Y{O5?hU^oyu~@Q3a6DsB@u$lM1j{y|{9KF;xgcs30#< zP$=hI1sjj|NOZ#;Z}R04n=TwYIDeYo7C9eIp60)I@Rs$vxA}6T^UkpGEH`e)|F_-J zx2~2EvlXmAbPPbOK^;(JI1;KLw#h5kHCDJ7oV!E3zM7P10{~?_ z3kNS7$S`UFh|FZ~HAKvhu~q%Dcg;3vhn46t&pj7QXX1_dTrTi^dHq>mDh$WRw>s@L+m(#w%Q&VJ(;8M%b`OJY-<|0Pq;D zJFpVvIKmaKiCC*XL!%RgP_~!2KA;fIX(}!OCnK1m5^&Y1I5sH!S@QOb2byOPicqYJ zrg8ed?&!bT({wK?;7s4eK`!)Hcw8ND751>K?lezh^L!+q<;VpbJq&0FE8;^$aP7Ip zNaPXOm%>7)_!@6VSh2%4_!w2og$W_1(5hdG$H_W0U1P&DFr9^*z-Y|P%fpNJh(WXe zAe3dNAoS_o;OZc2-S)5aZb0fVrhMa;;xOLSzD`|0z8f%>sOGrGkjL07>ogUKzi@mH zk0F=@f~Z}F+#L1f@ckuXE8HA;PV3EReA!%PXu+ma2yfjyfOYU2DoNJ6>a4 zUz}waL&z=t5UE|DJx}$L@XY<sTwydRnvI3P*q{A<9;e-vkOb~(Yz_;SjxIwkhs$iQ?p1jUCT_> zvVkuiVs7oKU^!H#@{Ex0bw}Pv>0;DUU2-mKF*YFUDsHQF+*TY?FXiyW)8cujrFILm zZKAnfLSm7ZO*tE*qM9%NKup`n$|nQG($j(XPMlb~PqXxeed5g|PHaA;7X0dvSQh&y DQ)@eC delta 4260 zcmeHKeT-CB6+iFu-aB9K&CIeh4BMRr3Da)lcA;T+wMB-;vTb%cfK5QNV`6JY=Y7bYEO2haFI8_P~Rp7BWc z`wZsbQXX=E->k2)aKW?&a7Tv&-`)jK92<3Te_!y6gFMHoqilEv`tks|g5_1AEad2} z%jJB?LTmRF8<57F1%n!RZY7sf%D^cAzylqBW~2;_EkrqYD+w5}a9znkc`^RaHmM(- zjX4)Bl$RnfDCJQnpzkH6DO6DGMF*fq3gT&{IGLW1UXKU6d|tKwm#FvL6m{DV`B_c( zG=J_eZ%ldGP{oONYF=h@WwD*1`Idg(NMpI5*VDMApKp}wmcd2vpts`MO!Kth^?rVm z6a@!<#FrQ{kNStmWBisp#^Ra(m`8|>sC1zG<~&B@DvvxiDCHu4OCDpf9w~^VmEuHN z6>Qw!@EqSAkr9UxJjb8WtJm4UEDU3TV$AZ4rV@*_Yo4*aI}@U3mNm`5p*%RiAE!L( z=@E1|RWavrWStcWkTZFR>+LuXrfE*h&x>;(bK(k(e+$vbOoh^#UPL1ny6C?%#IH%O zqILk7&ha1fWwJnt=Xr}vyk56S1NYOI_-R^Dex83_lY$kfx`?I|_5=yu{0Z)qsv7JO zERml$%G;=fYmf3LX?*=CZ=rE699v#cC0_diKP>k(+7q;I66c#KQH>lih?X(NS@?2; znX?B`K2+g)4~FVC2-`=)e#R)q&aYjcmyre*J@)5;UwoRFA&kK{-Oj@7OhE3GhM z*waJ?i%X*+*i3UoZm1bfg$@L*zv6YO#$fNE+?P-A!&KAB6JgC_Zjao$5>;7e@}|PV zP-Rh^5;*Xgygf}dZh47+KS#BUW!3r>WExqs!M;fHH(%mkB)#R6AqwLOjLF?r39)tH zB%dSsfl~@YM@}i)ID3lks9vEWA*YFy$^#=fASv>?0J27FH-;%m)fTD@00k+JaJ9ac z$7pKM@}f|V(O7lY3DGX$G{(Fc_(2{x@3cHGTS}!ypwDXUjzl(59y6uoe9d1G8r-xC zn53bKWpAPmIXlc7Wp9nY%$Je(iPOsaWv6*Ff@FA(HW_tWZL+4wXqtM)2VKtxs1g01oxv*qZn8>6b?{$zF#$vazd zU0)tU=`32ZpzXa-j{BfbZ|zPcmEL4h>7zF=%1SmuO?JXli4YiUyA_3Hek? zDYmRmi#p#VI@F>3R%oCuq+!NniAw3TG9b@SbWq3jS#+STPU)!+laAE0Q%0~rR~xcf zmCpKlwNSPUDzGiZNekl{bTn1sh$+gHl%L5%BectJ6R}A17E*wc56=+)XR<2t!2317 z+o)1d9Q%BUEMa)q3kQ>6L0RGxZ8AqCLC1MQjA<*JOPiRq1XY1S*$As4P*0yJ@h_8R zF@=BIR`^dKb7fg;_gieE$|@JiDaI7=g-}Ttr3S#DoP=^98Nz~dl@!dHywxNUow6Fq zu&lwp*Las^Ntu7?9KTKL3$CBzzq9d{^_w?%m)^EK$eri)}zCC{OgdBbZvlg+|&z_jm8-GyYCW9R^u8x6eI?1odGnR zpA>*iDl0WC83@EC;_ouUk+KS6kGzUqW5qH5!d>F!jie+r0N|wnddGBNk_r&;*R`9B z@X$!&RwD^zMBpfmBz*tvR3bYb$~*{9yWvvG_KT!BlgAqJiD>SM+Td)|7}WZr6b zTSp`F#(|w58F1%jYqqu z8H{R=-3tfJ0_-zRcG>1ufA4bf(ArNW2d?U`_QOHD69osl>;x$ss@S&h0Je3kVojgW z|4v=0=1m#pWxNXWzsx(uv3Uk#a3ZK*AwH)QeSpJo|FQKb#}TgZ5HHw$vbppyJHQnY zaU>x8nFw@A)DZ|I?KnDR3riDTxoh1Ia^79%aCM+1!t;vgqa^R@JcA_pNSlBW4QpM= zbF4Xj*AzGyKp!GM8d3P+d{B1rRaCI~!fJ?wd>0f~iZAgNB7`V9>ZkPl||GpL-7J}a`4U?u^1m51w=V@ikdAOa&*@b z_tR-JMGq2eZPUDnP;)Esxbh;-@f#l)Q|yVk;+g#I+?+tbU+jt@cF3B8!4Ws7 zEzfpxiSVLqst3m!_29rTY8Pb@h7$?HxPmDs2cuyaj-xoGJ`5-L?StZL)c+4{P<-(8 z26118_+eYf2X}85y^D(Bg;054YtLHm|CFLcU@G9ApR{WL#Df}t<#D_)8s8GS_Wxf0 zkiGt7&wuH4h7U`k*IKWeVX6(LdR;eFPuF@K&l)O$X@f8KF{52xR%@+l$o1IkVcS^1 zh`te+_sx8skegwu*YiyExQ;I$LN<|stht>*{SR~?h0FK3jW<%d7)_vj&7r)>SdZ-e zgr(MTOUV%v*g3)3r^M5CQ|%pLSpg?eUXq!?pHa43Ai0~_X)IfcmQV1VK&Z` zN0~lW`2g0?59r4mD*8@*Hj~90c;eGaM>PYujR)|81UOR$u(3EWl8V0DQO#3I0DXEL zPT!EAO64d4w~7e_MNB|O352Dy=kOgGyij?Z%0Ge4oGlV34B)j1B`@Jd(-U>F!om3S z0bPKr&~GYS_w4FmI*To^=Z=+*H|zBAJdyZe`B3>8xQabA?(6k_t^k^w2h!Zq{&lR-)F%1Eb*>MFSw)F}U44pv|6$JL z=@N6W_X^`Z0oV!!t1n}(_Nc_|oJk7}QK)>kBGath%B;xk!T-+ZJOAV}^Z)UQd|mnE z1wLaQJ8CKLj|rdWxr}-25}$Z??7HR>qQT&V8{+8h(EwZ=0YwYgPJji_Rg4B8=2Hg{ zpY$E^$zwjTxYsAK6Cs~MgnSwiE`L(-F~L+6Cq&4p2sw4jUHqVk?Ta&$QD*u;ObBm4 z17re>YF-mSZJ(at5w8@F17Ic-3z|zBEX`kXUwYow%#k|Zg)7K^5^-axVW}~Ca9}18 zx3Ao-nU3-T4>c&A$?6K!u>u5sGKu`L?C?5x`UZn$$X|jELhfSV_fkHU*fDiH%$k{b z<`{)a!o)#94oRbmqyYH7ia3&W5JQvvqqxxyCV(3N)c5rS*6StA%qc5@nk7C*2`C1w zZ-11(bCjgk;<`M`EP&POxdds{%8gs{LvjSSE##C6E` zGrfgKZ!Ne9P3Bj@iu87e)Q03L!bt0?<{GPx>OkE#Vn6aMGAE(zMST7d${E%t1zMb0&@~n zp{C}!j}kyUYqfCT`ucBzCqe(@QH3phC!WbRWTDcJ_IaLb`?|EXTEw$;{~6C8+>;Z- U_&4I(BRRvz-faE)NM3mNZxA9W8UO$Q delta 2181 zcmcJRL2MgE6o%i-?0D8|3vWW~b*!p3JzzK>84gJfjc`H8k!%tq5IL;n`hb)RTo6)j z@j|PH14TVl#N2#p%LRoBVR|!CL^)THf=~{1pm7h#N~Mx;Fb?m{?vliTOC%1~)69Es z=goWH{E4@n_O{dOHsec^SH{`uIHMoOpJzqq|pnN_JIo_!@cBudi;1CvomGYxX_sPGG z{-9z-HxTca1)#+aJW;J7U4Zj~1Q@G0co9#$=O%)<-zooT78_(!m#|f1zCCFZ?n9FoTqT$A19LMXa=-vyoaw6005-4y<*!YJe$TFQj0e-M z{-G}D3mRr#=b31W?9VA~^dz>*uI$hZH#i9MKw?70Fz%znuEejWZ4lRQNql0JdJi9ULv$=Ch*UKB60LWX*b= z66a>VSd&S1wVhg%+Y@KxGj*EJH;B(<%K0DoM11~>&u#+8e}nKk$z{mnUo<_9pU)*u zU2_S+duZtH=@&Syu~5VvzA%7gpzfvuK2`7lv>*B8BYXk`eDZ)#@?%`crw~4$Lil`& zQ9i?pBqbuB`T#7%=kryZTwe1T0e^}{z+*Um9`G8CEC+m+G@twGHI0`M?MctuD$6Kh z$PyW8D8#SvpsxcqIhax8^5d;?G>ZH&Co^GEz-FIX$Y=!gVdT!#GlqFHwaC&2@rQWb zM8Am-0{IhYiN88_ka)%ytRE2VrxC{xLzCk3_`xUY6XFw~-qSCxUN2!G>53AlRpJ9Y zpg3sX{8~Qd++*#PZ{&GqdF)R0xrl=sYq##ocgZolE5EhR$n)fBp67_?_@twCHPqWZ z=fduBy-fvFgu07*i@c#+g#tXPyItiC;Ahm!Kz~QMCbc5H4fQwV+8WVYUw?Bh1bS=1 zZD_G$dJC4Xw;CgoyMSxNN$V{DP6PQqE6!<-IId6fTknm_Prcm!<)M83&A$Oz4;_L4 diff --git a/backend-python/rwkv_pip/wkv_cuda.pyd b/backend-python/rwkv_pip/wkv_cuda.pyd index 11557cd871b2ae2377724d2225f51ece4280f5e3..2b8bc6f09b8f6ab8f5808a8dc4fdd59c9fee5807 100644 GIT binary patch delta 2472 zcmbuBU1%It6vxkeojbGH*_r)FcDhZo$x>2UFl<}0iS#8FnpC=M5usIfl|EU&Dip=~ zq8Y6;^`#X2m^_tGB*~+KIB!~{G{ujCSZp*}iD**NHnQ3z{oM83duNM^KDn@5cFsNL zp7TGyduDxqgYR$npj%OQ_Z%%KV+DnORr+f5)x&~fyfI9+vB?o5oE*VpPb&Sv1C#iu z)^GHOMh87En*d<<;0<=B0dM9Z znO>BK6b$8`_+Z8_ED<;`eHJ_!}HG{!i6M{!(@6J3ObT072t>>`DPl*BpC9 z@v{eNJ(%Us`{uBVua!CM;OkR!xKHfsg-hVW$(oCdln5`(;U_#$c;ZJaXhO%G|Dt0o zo&B4RiFDMgNJslWbd1~5@1HtCTjRk1xhV#Zd+G zcv_{zslh}`HlimUXNIqJmsxy3@wI2F_o%`CSx%GrD%Vj>&rm_Bn%<<9jnr^YPQig)xe!=S^t2PYDFI@N)dqsm1i`XZGS2Oz+ za33S#*Z79YBEF^w!!`n)*o6cxa>L~--65MKAnnwCWl^9qCT?Q8giva2Qc`bh3%l1aIfAzfA}H@{B~9Djw&t-GWW z-9vC?l84d}kRuS0Yl znO72IUh7@H_14uZ!PhJJDX}miSV%+Gph;40kCJ2rv9BE}aTfTnAQohD*{n#;NUt@U zO{cTYS)hzCyC!5vr)4IsIP=_}WJ*PGReezo1w$~=Q~HB%_#qE0En(4cO$-BFm(+*F zHO$B!10JEXgUU@j#e2GZGwNB~mAv;;^~Tw}E?Jnat+%;=6OZSS=N9zc!uN8#mvK+- z-$wg^=1?bI;`Yn8@C6>Xayz2XPLQAbbS+}*#BFSF`-wY}p~*XPY@EA;&ytQi8*n@i zR!Zs+PfgKqb@wuk1r5PEJ0QR{Ga-0dvD(J%ZBRi=wngZ8k~#~U#QvBmSJ zdmFfgAo+}U&(typk!P!B2EbE_RZ!*WtHI$0{zL>zNbCrb)@z5+M7j@&AlQ7F6O1uQ zFpKd9Y#x*ZzuUweJ#}_k@M7AMAKR9^IHusCR1fM++&C(TvmWNbJbFuTGToTWi7Q1! zLLw%+Xuv`78bh(Vdj)Z1*R3goZfrT}P0ss18_StWc4b=@hEUAB@b*R zU>G9?pBP;*ApA1Xdt#mq9TFAl#10SG5p{zx(Q9If+QAb@%Y?F?OfZv?2P{Mhw5!tI z(IKCsF-AzZohy9)pUIOLSrI?<6}DX)ZQb*NXkqkHx11@1HddmdP3A;J(Q{5rf~(G; z(z@qb)CCBBGV0#pU|KTu$S!5fO*>Dxvw@Cl8zOvaKwSRk< JOR$Ble*!w6fFA$= delta 2472 zcmbtWU2GIp6h8BJ?#y;)XZEMv=~B9FL)t)MQ!wme2uXdQ)v#G&OhB`%;Ys|%glNPU z-BAq1#1M?=?t>wX58XccqVuMGAk=6iF%m%=F^kY@ff`6)fwsGzd+!to@xjE0$<55U z=kNQzd+zxDdf#9FMW3R6)O~nBnHW&`qtc_%qXz?u@!lBOCZ@)XU}_wXJg@AiJ~D+* zYdee`!Qm;qwqfi`=xf3ISx841z~tE_2lC)+ujZK7bbRfV(lUbb)^?JGEBAGL4iM0_eX>YOvkUWhFw&5(9msXwFHU46Ey&{1Qe#H4*>1O;o(9_|?3iwf zvztuHN>qJ8Xz~WP(=c$1yqs7`sSypEd>Hf>8ll*9eO5TEB~F9|1S3sMNsa*zaqNq? z@g(PT>2}Cj)SVEnTPc)rDyvH^OqbW$9KgwEv)JSu58uI0Gn~t)C--mRscCBV;5lx; za0g%Gaf^3D71}ZC$$haLYU|itY;pUsWvQX5WjQuZFXPLVKR8J=)2xKVfpIy|P&88k zc-lyb+7v?-ElC5wkg!Kgxql7Ejzrz?JD?clYsKAdS$QF+i_Bkv&$3{e^r0KGOd-(}Dy@I{sY|XFYAg?~wlGP8ka1)7Srp2AK z)PCgI)KnfkWuyeEtZKe`u!X7?BEQ5l+CyZBoIX zv~hbsDVS#j)0Xl=^5?ueWhSg)0WECwVZBt`DwEH?oElvGy&EfQV$#fc@ec zL$SKMFLGANKkn6Oczb2nt%_?X=}{&FayLRd`9Vz`DJ9}EZagmIai%KpVHR|&ZqSi0 zaL40TUyd2F8@j%P1O&9tXpczc+A5rQ*Mw829Bc)4hk3`k9WKoPs;aipjp}`LTHRZ%)0r5~4 zrYS)o)Wly+EH*CKh=;TWM-8@1F@&vp9@%=O7TiMiGtyty4>sGS<~9eJ7@Obx4`-~6 A5C8xG